{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.9999863453266881, "global_step": 36617, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 1.8198362147406737e-08, "loss": 2.9556, "step": 1 }, { "epoch": 0.0, "learning_rate": 3.639672429481347e-08, "loss": 3.2939, "step": 2 }, { "epoch": 0.0, "learning_rate": 5.4595086442220206e-08, "loss": 3.085, "step": 3 }, { "epoch": 0.0, "learning_rate": 7.279344858962695e-08, "loss": 2.96, "step": 4 }, { "epoch": 0.0, "learning_rate": 9.099181073703367e-08, "loss": 2.8887, "step": 5 }, { "epoch": 0.0, "learning_rate": 1.0919017288444041e-07, "loss": 2.75, "step": 6 }, { "epoch": 0.0, "learning_rate": 1.2738853503184715e-07, "loss": 2.9751, "step": 7 }, { "epoch": 0.0, "learning_rate": 1.455868971792539e-07, "loss": 3.0625, "step": 8 }, { "epoch": 0.0, "learning_rate": 1.637852593266606e-07, "loss": 3.1455, "step": 9 }, { "epoch": 0.0, "learning_rate": 1.8198362147406735e-07, "loss": 3.0293, "step": 10 }, { "epoch": 0.0, "learning_rate": 2.0018198362147409e-07, "loss": 2.9561, "step": 11 }, { "epoch": 0.0, "learning_rate": 2.1838034576888083e-07, "loss": 2.9434, "step": 12 }, { "epoch": 0.0, "learning_rate": 2.3657870791628754e-07, "loss": 3.0137, "step": 13 }, { "epoch": 0.0, "learning_rate": 2.547770700636943e-07, "loss": 2.6338, "step": 14 }, { "epoch": 0.0, "learning_rate": 2.72975432211101e-07, "loss": 3.1523, "step": 15 }, { "epoch": 0.0, "learning_rate": 2.911737943585078e-07, "loss": 3.1885, "step": 16 }, { "epoch": 0.0, "learning_rate": 3.0937215650591447e-07, "loss": 3.1484, "step": 17 }, { "epoch": 0.0, "learning_rate": 3.275705186533212e-07, "loss": 3.2451, "step": 18 }, { "epoch": 0.0, "learning_rate": 3.45768880800728e-07, "loss": 2.9922, "step": 19 }, { "epoch": 0.0, "learning_rate": 3.639672429481347e-07, "loss": 2.9766, "step": 20 }, { "epoch": 0.0, "learning_rate": 3.8216560509554143e-07, "loss": 3.1494, "step": 21 }, { "epoch": 0.0, "learning_rate": 4.0036396724294817e-07, "loss": 2.9111, "step": 22 }, { "epoch": 0.0, "learning_rate": 4.185623293903549e-07, "loss": 3.4326, "step": 23 }, { "epoch": 0.0, "learning_rate": 4.3676069153776165e-07, "loss": 2.9893, "step": 24 }, { "epoch": 0.0, "learning_rate": 4.5495905368516834e-07, "loss": 3.2588, "step": 25 }, { "epoch": 0.0, "learning_rate": 4.731574158325751e-07, "loss": 3.3096, "step": 26 }, { "epoch": 0.0, "learning_rate": 4.913557779799818e-07, "loss": 3.0918, "step": 27 }, { "epoch": 0.0, "learning_rate": 5.095541401273886e-07, "loss": 3.1191, "step": 28 }, { "epoch": 0.0, "learning_rate": 5.277525022747953e-07, "loss": 3.1475, "step": 29 }, { "epoch": 0.0, "learning_rate": 5.45950864422202e-07, "loss": 2.8135, "step": 30 }, { "epoch": 0.0, "learning_rate": 5.641492265696088e-07, "loss": 3.4014, "step": 31 }, { "epoch": 0.0, "learning_rate": 5.823475887170156e-07, "loss": 3.1582, "step": 32 }, { "epoch": 0.0, "learning_rate": 6.005459508644223e-07, "loss": 2.9453, "step": 33 }, { "epoch": 0.0, "learning_rate": 6.187443130118289e-07, "loss": 2.8589, "step": 34 }, { "epoch": 0.0, "learning_rate": 6.369426751592357e-07, "loss": 2.9805, "step": 35 }, { "epoch": 0.0, "learning_rate": 6.551410373066424e-07, "loss": 3.0605, "step": 36 }, { "epoch": 0.0, "learning_rate": 6.733393994540492e-07, "loss": 3.0625, "step": 37 }, { "epoch": 0.0, "learning_rate": 6.91537761601456e-07, "loss": 3.0059, "step": 38 }, { "epoch": 0.0, "learning_rate": 7.097361237488627e-07, "loss": 2.7793, "step": 39 }, { "epoch": 0.0, "learning_rate": 7.279344858962694e-07, "loss": 2.8896, "step": 40 }, { "epoch": 0.0, "learning_rate": 7.461328480436761e-07, "loss": 3.2939, "step": 41 }, { "epoch": 0.0, "learning_rate": 7.643312101910829e-07, "loss": 3.125, "step": 42 }, { "epoch": 0.0, "learning_rate": 7.825295723384895e-07, "loss": 2.8975, "step": 43 }, { "epoch": 0.0, "learning_rate": 8.007279344858963e-07, "loss": 3.3418, "step": 44 }, { "epoch": 0.0, "learning_rate": 8.189262966333031e-07, "loss": 3.0352, "step": 45 }, { "epoch": 0.0, "learning_rate": 8.371246587807098e-07, "loss": 3.375, "step": 46 }, { "epoch": 0.0, "learning_rate": 8.553230209281166e-07, "loss": 2.9277, "step": 47 }, { "epoch": 0.0, "learning_rate": 8.735213830755233e-07, "loss": 2.9033, "step": 48 }, { "epoch": 0.0, "learning_rate": 8.9171974522293e-07, "loss": 2.1895, "step": 49 }, { "epoch": 0.0, "learning_rate": 9.099181073703367e-07, "loss": 2.8555, "step": 50 }, { "epoch": 0.0, "learning_rate": 9.281164695177435e-07, "loss": 3.1128, "step": 51 }, { "epoch": 0.0, "learning_rate": 9.463148316651502e-07, "loss": 3.2158, "step": 52 }, { "epoch": 0.0, "learning_rate": 9.64513193812557e-07, "loss": 2.8691, "step": 53 }, { "epoch": 0.0, "learning_rate": 9.827115559599636e-07, "loss": 2.7725, "step": 54 }, { "epoch": 0.0, "learning_rate": 1.0009099181073705e-06, "loss": 2.8984, "step": 55 }, { "epoch": 0.0, "learning_rate": 1.0191082802547772e-06, "loss": 2.8135, "step": 56 }, { "epoch": 0.0, "learning_rate": 1.037306642402184e-06, "loss": 2.9434, "step": 57 }, { "epoch": 0.0, "learning_rate": 1.0555050045495906e-06, "loss": 2.957, "step": 58 }, { "epoch": 0.0, "learning_rate": 1.0737033666969973e-06, "loss": 2.915, "step": 59 }, { "epoch": 0.0, "learning_rate": 1.091901728844404e-06, "loss": 2.6943, "step": 60 }, { "epoch": 0.0, "learning_rate": 1.1101000909918109e-06, "loss": 2.7061, "step": 61 }, { "epoch": 0.0, "learning_rate": 1.1282984531392176e-06, "loss": 2.0957, "step": 62 }, { "epoch": 0.0, "learning_rate": 1.1464968152866242e-06, "loss": 2.8203, "step": 63 }, { "epoch": 0.0, "learning_rate": 1.1646951774340311e-06, "loss": 2.8955, "step": 64 }, { "epoch": 0.0, "learning_rate": 1.1828935395814378e-06, "loss": 2.9902, "step": 65 }, { "epoch": 0.0, "learning_rate": 1.2010919017288445e-06, "loss": 2.7168, "step": 66 }, { "epoch": 0.0, "learning_rate": 1.2192902638762512e-06, "loss": 2.7363, "step": 67 }, { "epoch": 0.0, "learning_rate": 1.2374886260236579e-06, "loss": 2.9766, "step": 68 }, { "epoch": 0.0, "learning_rate": 1.2556869881710648e-06, "loss": 2.9365, "step": 69 }, { "epoch": 0.0, "learning_rate": 1.2738853503184715e-06, "loss": 2.9634, "step": 70 }, { "epoch": 0.0, "learning_rate": 1.292083712465878e-06, "loss": 3.2402, "step": 71 }, { "epoch": 0.0, "learning_rate": 1.3102820746132848e-06, "loss": 2.6636, "step": 72 }, { "epoch": 0.0, "learning_rate": 1.3284804367606915e-06, "loss": 2.748, "step": 73 }, { "epoch": 0.0, "learning_rate": 1.3466787989080984e-06, "loss": 2.7373, "step": 74 }, { "epoch": 0.0, "learning_rate": 1.3648771610555051e-06, "loss": 2.7734, "step": 75 }, { "epoch": 0.0, "learning_rate": 1.383075523202912e-06, "loss": 2.1279, "step": 76 }, { "epoch": 0.0, "learning_rate": 1.4012738853503185e-06, "loss": 2.7324, "step": 77 }, { "epoch": 0.0, "learning_rate": 1.4194722474977254e-06, "loss": 3.0762, "step": 78 }, { "epoch": 0.0, "learning_rate": 1.437670609645132e-06, "loss": 2.8013, "step": 79 }, { "epoch": 0.0, "learning_rate": 1.4558689717925388e-06, "loss": 2.812, "step": 80 }, { "epoch": 0.0, "learning_rate": 1.4740673339399455e-06, "loss": 2.6143, "step": 81 }, { "epoch": 0.0, "learning_rate": 1.4922656960873521e-06, "loss": 2.8516, "step": 82 }, { "epoch": 0.0, "learning_rate": 1.510464058234759e-06, "loss": 2.5049, "step": 83 }, { "epoch": 0.0, "learning_rate": 1.5286624203821657e-06, "loss": 2.8105, "step": 84 }, { "epoch": 0.0, "learning_rate": 1.5468607825295726e-06, "loss": 2.873, "step": 85 }, { "epoch": 0.0, "learning_rate": 1.565059144676979e-06, "loss": 2.604, "step": 86 }, { "epoch": 0.0, "learning_rate": 1.583257506824386e-06, "loss": 2.8818, "step": 87 }, { "epoch": 0.0, "learning_rate": 1.6014558689717927e-06, "loss": 2.9258, "step": 88 }, { "epoch": 0.0, "learning_rate": 1.6196542311191994e-06, "loss": 2.6875, "step": 89 }, { "epoch": 0.0, "learning_rate": 1.6378525932666063e-06, "loss": 2.708, "step": 90 }, { "epoch": 0.0, "learning_rate": 1.6560509554140127e-06, "loss": 2.5981, "step": 91 }, { "epoch": 0.0, "learning_rate": 1.6742493175614196e-06, "loss": 2.6377, "step": 92 }, { "epoch": 0.0, "learning_rate": 1.6924476797088263e-06, "loss": 2.5674, "step": 93 }, { "epoch": 0.0, "learning_rate": 1.7106460418562332e-06, "loss": 2.376, "step": 94 }, { "epoch": 0.0, "learning_rate": 1.7288444040036397e-06, "loss": 2.5024, "step": 95 }, { "epoch": 0.0, "learning_rate": 1.7470427661510466e-06, "loss": 2.5527, "step": 96 }, { "epoch": 0.0, "learning_rate": 1.7652411282984533e-06, "loss": 2.0522, "step": 97 }, { "epoch": 0.0, "learning_rate": 1.78343949044586e-06, "loss": 2.3467, "step": 98 }, { "epoch": 0.0, "learning_rate": 1.8016378525932669e-06, "loss": 2.5283, "step": 99 }, { "epoch": 0.0, "learning_rate": 1.8198362147406733e-06, "loss": 2.583, "step": 100 }, { "epoch": 0.0, "learning_rate": 1.8380345768880802e-06, "loss": 2.6616, "step": 101 }, { "epoch": 0.0, "learning_rate": 1.856232939035487e-06, "loss": 2.4248, "step": 102 }, { "epoch": 0.0, "learning_rate": 1.8744313011828938e-06, "loss": 2.6797, "step": 103 }, { "epoch": 0.0, "learning_rate": 1.8926296633303003e-06, "loss": 2.4424, "step": 104 }, { "epoch": 0.0, "learning_rate": 1.9108280254777074e-06, "loss": 2.52, "step": 105 }, { "epoch": 0.0, "learning_rate": 1.929026387625114e-06, "loss": 2.3975, "step": 106 }, { "epoch": 0.0, "learning_rate": 1.9472247497725204e-06, "loss": 2.4907, "step": 107 }, { "epoch": 0.0, "learning_rate": 1.9654231119199273e-06, "loss": 2.3569, "step": 108 }, { "epoch": 0.0, "learning_rate": 1.983621474067334e-06, "loss": 2.4131, "step": 109 }, { "epoch": 0.0, "learning_rate": 2.001819836214741e-06, "loss": 2.5024, "step": 110 }, { "epoch": 0.0, "learning_rate": 2.0200181983621475e-06, "loss": 2.3818, "step": 111 }, { "epoch": 0.0, "learning_rate": 2.0382165605095544e-06, "loss": 2.4004, "step": 112 }, { "epoch": 0.0, "learning_rate": 2.056414922656961e-06, "loss": 2.4458, "step": 113 }, { "epoch": 0.0, "learning_rate": 2.074613284804368e-06, "loss": 2.4648, "step": 114 }, { "epoch": 0.0, "learning_rate": 2.0928116469517747e-06, "loss": 2.5591, "step": 115 }, { "epoch": 0.0, "learning_rate": 2.111010009099181e-06, "loss": 2.3154, "step": 116 }, { "epoch": 0.0, "learning_rate": 2.129208371246588e-06, "loss": 2.3804, "step": 117 }, { "epoch": 0.0, "learning_rate": 2.1474067333939946e-06, "loss": 2.4517, "step": 118 }, { "epoch": 0.0, "learning_rate": 2.1656050955414015e-06, "loss": 2.3672, "step": 119 }, { "epoch": 0.0, "learning_rate": 2.183803457688808e-06, "loss": 2.3359, "step": 120 }, { "epoch": 0.0, "learning_rate": 2.202001819836215e-06, "loss": 2.2822, "step": 121 }, { "epoch": 0.0, "learning_rate": 2.2202001819836217e-06, "loss": 2.4136, "step": 122 }, { "epoch": 0.0, "learning_rate": 2.2383985441310286e-06, "loss": 2.2852, "step": 123 }, { "epoch": 0.0, "learning_rate": 2.256596906278435e-06, "loss": 2.4414, "step": 124 }, { "epoch": 0.0, "learning_rate": 2.2747952684258416e-06, "loss": 2.4702, "step": 125 }, { "epoch": 0.0, "learning_rate": 2.2929936305732485e-06, "loss": 2.2754, "step": 126 }, { "epoch": 0.0, "learning_rate": 2.3111919927206554e-06, "loss": 2.5259, "step": 127 }, { "epoch": 0.0, "learning_rate": 2.3293903548680623e-06, "loss": 2.3066, "step": 128 }, { "epoch": 0.0, "learning_rate": 2.3475887170154688e-06, "loss": 2.3047, "step": 129 }, { "epoch": 0.0, "learning_rate": 2.3657870791628757e-06, "loss": 2.3105, "step": 130 }, { "epoch": 0.0, "learning_rate": 2.383985441310282e-06, "loss": 2.3218, "step": 131 }, { "epoch": 0.0, "learning_rate": 2.402183803457689e-06, "loss": 2.4043, "step": 132 }, { "epoch": 0.0, "learning_rate": 2.420382165605096e-06, "loss": 2.2646, "step": 133 }, { "epoch": 0.0, "learning_rate": 2.4385805277525024e-06, "loss": 2.3335, "step": 134 }, { "epoch": 0.0, "learning_rate": 2.4567788898999093e-06, "loss": 2.3789, "step": 135 }, { "epoch": 0.0, "learning_rate": 2.4749772520473158e-06, "loss": 2.3291, "step": 136 }, { "epoch": 0.0, "learning_rate": 2.4931756141947227e-06, "loss": 2.1895, "step": 137 }, { "epoch": 0.0, "learning_rate": 2.5113739763421296e-06, "loss": 2.3477, "step": 138 }, { "epoch": 0.0, "learning_rate": 2.529572338489536e-06, "loss": 2.3608, "step": 139 }, { "epoch": 0.0, "learning_rate": 2.547770700636943e-06, "loss": 2.3467, "step": 140 }, { "epoch": 0.0, "learning_rate": 2.56596906278435e-06, "loss": 2.1938, "step": 141 }, { "epoch": 0.0, "learning_rate": 2.584167424931756e-06, "loss": 2.2598, "step": 142 }, { "epoch": 0.0, "learning_rate": 2.602365787079163e-06, "loss": 2.2993, "step": 143 }, { "epoch": 0.0, "learning_rate": 2.6205641492265697e-06, "loss": 2.1401, "step": 144 }, { "epoch": 0.0, "learning_rate": 2.6387625113739766e-06, "loss": 2.2808, "step": 145 }, { "epoch": 0.0, "learning_rate": 2.656960873521383e-06, "loss": 2.123, "step": 146 }, { "epoch": 0.0, "learning_rate": 2.67515923566879e-06, "loss": 2.2319, "step": 147 }, { "epoch": 0.0, "learning_rate": 2.693357597816197e-06, "loss": 2.29, "step": 148 }, { "epoch": 0.0, "learning_rate": 2.7115559599636038e-06, "loss": 2.1377, "step": 149 }, { "epoch": 0.0, "learning_rate": 2.7297543221110102e-06, "loss": 2.146, "step": 150 }, { "epoch": 0.0, "learning_rate": 2.747952684258417e-06, "loss": 2.2339, "step": 151 }, { "epoch": 0.0, "learning_rate": 2.766151046405824e-06, "loss": 2.2217, "step": 152 }, { "epoch": 0.0, "learning_rate": 2.78434940855323e-06, "loss": 2.0503, "step": 153 }, { "epoch": 0.0, "learning_rate": 2.802547770700637e-06, "loss": 2.1567, "step": 154 }, { "epoch": 0.0, "learning_rate": 2.820746132848044e-06, "loss": 2.0674, "step": 155 }, { "epoch": 0.0, "learning_rate": 2.8389444949954508e-06, "loss": 2.0879, "step": 156 }, { "epoch": 0.0, "learning_rate": 2.8571428571428573e-06, "loss": 2.1631, "step": 157 }, { "epoch": 0.0, "learning_rate": 2.875341219290264e-06, "loss": 2.146, "step": 158 }, { "epoch": 0.0, "learning_rate": 2.893539581437671e-06, "loss": 2.2368, "step": 159 }, { "epoch": 0.0, "learning_rate": 2.9117379435850775e-06, "loss": 2.2476, "step": 160 }, { "epoch": 0.0, "learning_rate": 2.9299363057324844e-06, "loss": 2.022, "step": 161 }, { "epoch": 0.0, "learning_rate": 2.948134667879891e-06, "loss": 2.0845, "step": 162 }, { "epoch": 0.0, "learning_rate": 2.966333030027298e-06, "loss": 2.1514, "step": 163 }, { "epoch": 0.0, "learning_rate": 2.9845313921747043e-06, "loss": 2.0098, "step": 164 }, { "epoch": 0.0, "learning_rate": 3.002729754322111e-06, "loss": 1.9971, "step": 165 }, { "epoch": 0.0, "learning_rate": 3.020928116469518e-06, "loss": 2.0869, "step": 166 }, { "epoch": 0.0, "learning_rate": 3.039126478616925e-06, "loss": 1.9697, "step": 167 }, { "epoch": 0.0, "learning_rate": 3.0573248407643314e-06, "loss": 2.064, "step": 168 }, { "epoch": 0.0, "learning_rate": 3.0755232029117383e-06, "loss": 2.0859, "step": 169 }, { "epoch": 0.0, "learning_rate": 3.0937215650591452e-06, "loss": 2.1562, "step": 170 }, { "epoch": 0.0, "learning_rate": 3.1119199272065513e-06, "loss": 2.2632, "step": 171 }, { "epoch": 0.0, "learning_rate": 3.130118289353958e-06, "loss": 2.1382, "step": 172 }, { "epoch": 0.0, "learning_rate": 3.148316651501365e-06, "loss": 2.0679, "step": 173 }, { "epoch": 0.0, "learning_rate": 3.166515013648772e-06, "loss": 2.0923, "step": 174 }, { "epoch": 0.0, "learning_rate": 3.1847133757961785e-06, "loss": 2.062, "step": 175 }, { "epoch": 0.0, "learning_rate": 3.2029117379435854e-06, "loss": 2.2598, "step": 176 }, { "epoch": 0.0, "learning_rate": 3.2211101000909923e-06, "loss": 2.0942, "step": 177 }, { "epoch": 0.0, "learning_rate": 3.2393084622383987e-06, "loss": 2.1816, "step": 178 }, { "epoch": 0.0, "learning_rate": 3.2575068243858056e-06, "loss": 2.1626, "step": 179 }, { "epoch": 0.0, "learning_rate": 3.2757051865332125e-06, "loss": 2.1084, "step": 180 }, { "epoch": 0.0, "learning_rate": 3.2939035486806194e-06, "loss": 2.2305, "step": 181 }, { "epoch": 0.0, "learning_rate": 3.3121019108280255e-06, "loss": 2.0737, "step": 182 }, { "epoch": 0.0, "learning_rate": 3.3303002729754324e-06, "loss": 2.0371, "step": 183 }, { "epoch": 0.01, "learning_rate": 3.3484986351228393e-06, "loss": 2.1147, "step": 184 }, { "epoch": 0.01, "learning_rate": 3.3666969972702458e-06, "loss": 2.1499, "step": 185 }, { "epoch": 0.01, "learning_rate": 3.3848953594176527e-06, "loss": 2.1362, "step": 186 }, { "epoch": 0.01, "learning_rate": 3.4030937215650596e-06, "loss": 2.0913, "step": 187 }, { "epoch": 0.01, "learning_rate": 3.4212920837124665e-06, "loss": 2.1279, "step": 188 }, { "epoch": 0.01, "learning_rate": 3.4394904458598725e-06, "loss": 2.2202, "step": 189 }, { "epoch": 0.01, "learning_rate": 3.4576888080072794e-06, "loss": 1.9829, "step": 190 }, { "epoch": 0.01, "learning_rate": 3.4758871701546863e-06, "loss": 1.9634, "step": 191 }, { "epoch": 0.01, "learning_rate": 3.494085532302093e-06, "loss": 1.8213, "step": 192 }, { "epoch": 0.01, "learning_rate": 3.5122838944494997e-06, "loss": 1.9927, "step": 193 }, { "epoch": 0.01, "learning_rate": 3.5304822565969066e-06, "loss": 1.9473, "step": 194 }, { "epoch": 0.01, "learning_rate": 3.5486806187443135e-06, "loss": 2.168, "step": 195 }, { "epoch": 0.01, "learning_rate": 3.56687898089172e-06, "loss": 2.1313, "step": 196 }, { "epoch": 0.01, "learning_rate": 3.585077343039127e-06, "loss": 2.0078, "step": 197 }, { "epoch": 0.01, "learning_rate": 3.6032757051865337e-06, "loss": 2.127, "step": 198 }, { "epoch": 0.01, "learning_rate": 3.6214740673339406e-06, "loss": 2.1157, "step": 199 }, { "epoch": 0.01, "learning_rate": 3.6396724294813467e-06, "loss": 2.0137, "step": 200 }, { "epoch": 0.01, "learning_rate": 3.6578707916287536e-06, "loss": 2.0742, "step": 201 }, { "epoch": 0.01, "learning_rate": 3.6760691537761605e-06, "loss": 2.0752, "step": 202 }, { "epoch": 0.01, "learning_rate": 3.694267515923567e-06, "loss": 2.2163, "step": 203 }, { "epoch": 0.01, "learning_rate": 3.712465878070974e-06, "loss": 2.0688, "step": 204 }, { "epoch": 0.01, "learning_rate": 3.7306642402183808e-06, "loss": 2.0215, "step": 205 }, { "epoch": 0.01, "learning_rate": 3.7488626023657877e-06, "loss": 1.9053, "step": 206 }, { "epoch": 0.01, "learning_rate": 3.7670609645131937e-06, "loss": 1.9043, "step": 207 }, { "epoch": 0.01, "learning_rate": 3.7852593266606006e-06, "loss": 1.9717, "step": 208 }, { "epoch": 0.01, "learning_rate": 3.8034576888080075e-06, "loss": 2.1182, "step": 209 }, { "epoch": 0.01, "learning_rate": 3.821656050955415e-06, "loss": 2.0254, "step": 210 }, { "epoch": 0.01, "learning_rate": 3.839854413102821e-06, "loss": 2.0542, "step": 211 }, { "epoch": 0.01, "learning_rate": 3.858052775250228e-06, "loss": 1.9033, "step": 212 }, { "epoch": 0.01, "learning_rate": 3.876251137397635e-06, "loss": 1.9385, "step": 213 }, { "epoch": 0.01, "learning_rate": 3.894449499545041e-06, "loss": 1.897, "step": 214 }, { "epoch": 0.01, "learning_rate": 3.912647861692448e-06, "loss": 2.1455, "step": 215 }, { "epoch": 0.01, "learning_rate": 3.9308462238398545e-06, "loss": 2.0381, "step": 216 }, { "epoch": 0.01, "learning_rate": 3.949044585987262e-06, "loss": 1.9517, "step": 217 }, { "epoch": 0.01, "learning_rate": 3.967242948134668e-06, "loss": 2.0698, "step": 218 }, { "epoch": 0.01, "learning_rate": 3.985441310282075e-06, "loss": 2.0259, "step": 219 }, { "epoch": 0.01, "learning_rate": 4.003639672429482e-06, "loss": 1.9214, "step": 220 }, { "epoch": 0.01, "learning_rate": 4.021838034576888e-06, "loss": 1.96, "step": 221 }, { "epoch": 0.01, "learning_rate": 4.040036396724295e-06, "loss": 1.9829, "step": 222 }, { "epoch": 0.01, "learning_rate": 4.0582347588717016e-06, "loss": 1.9165, "step": 223 }, { "epoch": 0.01, "learning_rate": 4.076433121019109e-06, "loss": 1.9414, "step": 224 }, { "epoch": 0.01, "learning_rate": 4.094631483166515e-06, "loss": 1.9287, "step": 225 }, { "epoch": 0.01, "learning_rate": 4.112829845313922e-06, "loss": 1.9878, "step": 226 }, { "epoch": 0.01, "learning_rate": 4.131028207461329e-06, "loss": 1.792, "step": 227 }, { "epoch": 0.01, "learning_rate": 4.149226569608736e-06, "loss": 1.9888, "step": 228 }, { "epoch": 0.01, "learning_rate": 4.167424931756142e-06, "loss": 2.1455, "step": 229 }, { "epoch": 0.01, "learning_rate": 4.185623293903549e-06, "loss": 2.0527, "step": 230 }, { "epoch": 0.01, "learning_rate": 4.203821656050956e-06, "loss": 1.9067, "step": 231 }, { "epoch": 0.01, "learning_rate": 4.222020018198362e-06, "loss": 1.853, "step": 232 }, { "epoch": 0.01, "learning_rate": 4.240218380345769e-06, "loss": 2.0669, "step": 233 }, { "epoch": 0.01, "learning_rate": 4.258416742493176e-06, "loss": 1.9707, "step": 234 }, { "epoch": 0.01, "learning_rate": 4.276615104640583e-06, "loss": 1.9253, "step": 235 }, { "epoch": 0.01, "learning_rate": 4.294813466787989e-06, "loss": 1.8408, "step": 236 }, { "epoch": 0.01, "learning_rate": 4.3130118289353964e-06, "loss": 2.0337, "step": 237 }, { "epoch": 0.01, "learning_rate": 4.331210191082803e-06, "loss": 2.0479, "step": 238 }, { "epoch": 0.01, "learning_rate": 4.349408553230209e-06, "loss": 1.6367, "step": 239 }, { "epoch": 0.01, "learning_rate": 4.367606915377616e-06, "loss": 1.9797, "step": 240 }, { "epoch": 0.01, "learning_rate": 4.385805277525023e-06, "loss": 2.0981, "step": 241 }, { "epoch": 0.01, "learning_rate": 4.40400363967243e-06, "loss": 2.0181, "step": 242 }, { "epoch": 0.01, "learning_rate": 4.422202001819836e-06, "loss": 1.896, "step": 243 }, { "epoch": 0.01, "learning_rate": 4.4404003639672435e-06, "loss": 1.8091, "step": 244 }, { "epoch": 0.01, "learning_rate": 4.45859872611465e-06, "loss": 1.7744, "step": 245 }, { "epoch": 0.01, "learning_rate": 4.476797088262057e-06, "loss": 1.8418, "step": 246 }, { "epoch": 0.01, "learning_rate": 4.494995450409464e-06, "loss": 1.9771, "step": 247 }, { "epoch": 0.01, "learning_rate": 4.51319381255687e-06, "loss": 1.7051, "step": 248 }, { "epoch": 0.01, "learning_rate": 4.5313921747042775e-06, "loss": 2.0386, "step": 249 }, { "epoch": 0.01, "learning_rate": 4.549590536851683e-06, "loss": 2.0615, "step": 250 }, { "epoch": 0.01, "learning_rate": 4.5677888989990905e-06, "loss": 2.001, "step": 251 }, { "epoch": 0.01, "learning_rate": 4.585987261146497e-06, "loss": 1.9517, "step": 252 }, { "epoch": 0.01, "learning_rate": 4.604185623293904e-06, "loss": 1.9087, "step": 253 }, { "epoch": 0.01, "learning_rate": 4.622383985441311e-06, "loss": 1.9058, "step": 254 }, { "epoch": 0.01, "learning_rate": 4.640582347588717e-06, "loss": 2.0244, "step": 255 }, { "epoch": 0.01, "learning_rate": 4.6587807097361246e-06, "loss": 1.9404, "step": 256 }, { "epoch": 0.01, "learning_rate": 4.676979071883531e-06, "loss": 1.9663, "step": 257 }, { "epoch": 0.01, "learning_rate": 4.6951774340309375e-06, "loss": 1.895, "step": 258 }, { "epoch": 0.01, "learning_rate": 4.713375796178344e-06, "loss": 1.9165, "step": 259 }, { "epoch": 0.01, "learning_rate": 4.731574158325751e-06, "loss": 2.0225, "step": 260 }, { "epoch": 0.01, "learning_rate": 4.749772520473158e-06, "loss": 2.0762, "step": 261 }, { "epoch": 0.01, "learning_rate": 4.767970882620564e-06, "loss": 1.9458, "step": 262 }, { "epoch": 0.01, "learning_rate": 4.7861692447679716e-06, "loss": 1.9204, "step": 263 }, { "epoch": 0.01, "learning_rate": 4.804367606915378e-06, "loss": 1.7871, "step": 264 }, { "epoch": 0.01, "learning_rate": 4.8225659690627845e-06, "loss": 1.9458, "step": 265 }, { "epoch": 0.01, "learning_rate": 4.840764331210192e-06, "loss": 2.0337, "step": 266 }, { "epoch": 0.01, "learning_rate": 4.858962693357598e-06, "loss": 1.916, "step": 267 }, { "epoch": 0.01, "learning_rate": 4.877161055505005e-06, "loss": 1.918, "step": 268 }, { "epoch": 0.01, "learning_rate": 4.895359417652411e-06, "loss": 1.8369, "step": 269 }, { "epoch": 0.01, "learning_rate": 4.913557779799819e-06, "loss": 1.7515, "step": 270 }, { "epoch": 0.01, "learning_rate": 4.931756141947225e-06, "loss": 2.0, "step": 271 }, { "epoch": 0.01, "learning_rate": 4.9499545040946315e-06, "loss": 1.9062, "step": 272 }, { "epoch": 0.01, "learning_rate": 4.968152866242039e-06, "loss": 1.79, "step": 273 }, { "epoch": 0.01, "learning_rate": 4.986351228389445e-06, "loss": 1.8677, "step": 274 }, { "epoch": 0.01, "learning_rate": 5.004549590536853e-06, "loss": 1.8491, "step": 275 }, { "epoch": 0.01, "learning_rate": 5.022747952684259e-06, "loss": 1.8569, "step": 276 }, { "epoch": 0.01, "learning_rate": 5.040946314831665e-06, "loss": 1.8516, "step": 277 }, { "epoch": 0.01, "learning_rate": 5.059144676979072e-06, "loss": 1.9927, "step": 278 }, { "epoch": 0.01, "learning_rate": 5.0773430391264786e-06, "loss": 1.9736, "step": 279 }, { "epoch": 0.01, "learning_rate": 5.095541401273886e-06, "loss": 1.8525, "step": 280 }, { "epoch": 0.01, "learning_rate": 5.113739763421292e-06, "loss": 1.7935, "step": 281 }, { "epoch": 0.01, "learning_rate": 5.1319381255687e-06, "loss": 1.8237, "step": 282 }, { "epoch": 0.01, "learning_rate": 5.150136487716106e-06, "loss": 1.9312, "step": 283 }, { "epoch": 0.01, "learning_rate": 5.168334849863512e-06, "loss": 1.8809, "step": 284 }, { "epoch": 0.01, "learning_rate": 5.186533212010919e-06, "loss": 1.8623, "step": 285 }, { "epoch": 0.01, "learning_rate": 5.204731574158326e-06, "loss": 2.0127, "step": 286 }, { "epoch": 0.01, "learning_rate": 5.222929936305733e-06, "loss": 1.8452, "step": 287 }, { "epoch": 0.01, "learning_rate": 5.241128298453139e-06, "loss": 1.9927, "step": 288 }, { "epoch": 0.01, "learning_rate": 5.259326660600547e-06, "loss": 1.769, "step": 289 }, { "epoch": 0.01, "learning_rate": 5.277525022747953e-06, "loss": 1.7656, "step": 290 }, { "epoch": 0.01, "learning_rate": 5.29572338489536e-06, "loss": 1.9707, "step": 291 }, { "epoch": 0.01, "learning_rate": 5.313921747042766e-06, "loss": 2.0088, "step": 292 }, { "epoch": 0.01, "learning_rate": 5.3321201091901735e-06, "loss": 1.8638, "step": 293 }, { "epoch": 0.01, "learning_rate": 5.35031847133758e-06, "loss": 1.957, "step": 294 }, { "epoch": 0.01, "learning_rate": 5.368516833484987e-06, "loss": 2.0605, "step": 295 }, { "epoch": 0.01, "learning_rate": 5.386715195632394e-06, "loss": 1.8735, "step": 296 }, { "epoch": 0.01, "learning_rate": 5.404913557779801e-06, "loss": 2.1338, "step": 297 }, { "epoch": 0.01, "learning_rate": 5.4231119199272075e-06, "loss": 1.9766, "step": 298 }, { "epoch": 0.01, "learning_rate": 5.441310282074613e-06, "loss": 1.9043, "step": 299 }, { "epoch": 0.01, "learning_rate": 5.4595086442220205e-06, "loss": 1.8062, "step": 300 }, { "epoch": 0.01, "learning_rate": 5.477707006369427e-06, "loss": 2.0312, "step": 301 }, { "epoch": 0.01, "learning_rate": 5.495905368516834e-06, "loss": 1.7822, "step": 302 }, { "epoch": 0.01, "learning_rate": 5.514103730664241e-06, "loss": 1.7803, "step": 303 }, { "epoch": 0.01, "learning_rate": 5.532302092811648e-06, "loss": 1.8936, "step": 304 }, { "epoch": 0.01, "learning_rate": 5.5505004549590545e-06, "loss": 1.9463, "step": 305 }, { "epoch": 0.01, "learning_rate": 5.56869881710646e-06, "loss": 2.0327, "step": 306 }, { "epoch": 0.01, "learning_rate": 5.5868971792538675e-06, "loss": 1.9399, "step": 307 }, { "epoch": 0.01, "learning_rate": 5.605095541401274e-06, "loss": 2.0142, "step": 308 }, { "epoch": 0.01, "learning_rate": 5.623293903548681e-06, "loss": 1.7539, "step": 309 }, { "epoch": 0.01, "learning_rate": 5.641492265696088e-06, "loss": 1.957, "step": 310 }, { "epoch": 0.01, "learning_rate": 5.659690627843495e-06, "loss": 1.7666, "step": 311 }, { "epoch": 0.01, "learning_rate": 5.6778889899909016e-06, "loss": 1.7681, "step": 312 }, { "epoch": 0.01, "learning_rate": 5.696087352138307e-06, "loss": 1.8296, "step": 313 }, { "epoch": 0.01, "learning_rate": 5.7142857142857145e-06, "loss": 1.9331, "step": 314 }, { "epoch": 0.01, "learning_rate": 5.732484076433121e-06, "loss": 1.7847, "step": 315 }, { "epoch": 0.01, "learning_rate": 5.750682438580528e-06, "loss": 1.9233, "step": 316 }, { "epoch": 0.01, "learning_rate": 5.768880800727935e-06, "loss": 1.832, "step": 317 }, { "epoch": 0.01, "learning_rate": 5.787079162875342e-06, "loss": 2.0327, "step": 318 }, { "epoch": 0.01, "learning_rate": 5.805277525022749e-06, "loss": 1.8696, "step": 319 }, { "epoch": 0.01, "learning_rate": 5.823475887170155e-06, "loss": 2.0151, "step": 320 }, { "epoch": 0.01, "learning_rate": 5.8416742493175615e-06, "loss": 1.874, "step": 321 }, { "epoch": 0.01, "learning_rate": 5.859872611464969e-06, "loss": 1.7144, "step": 322 }, { "epoch": 0.01, "learning_rate": 5.878070973612375e-06, "loss": 1.554, "step": 323 }, { "epoch": 0.01, "learning_rate": 5.896269335759782e-06, "loss": 1.9658, "step": 324 }, { "epoch": 0.01, "learning_rate": 5.914467697907189e-06, "loss": 2.0171, "step": 325 }, { "epoch": 0.01, "learning_rate": 5.932666060054596e-06, "loss": 1.7739, "step": 326 }, { "epoch": 0.01, "learning_rate": 5.950864422202002e-06, "loss": 2.0459, "step": 327 }, { "epoch": 0.01, "learning_rate": 5.9690627843494086e-06, "loss": 1.8569, "step": 328 }, { "epoch": 0.01, "learning_rate": 5.987261146496816e-06, "loss": 1.9546, "step": 329 }, { "epoch": 0.01, "learning_rate": 6.005459508644222e-06, "loss": 1.9434, "step": 330 }, { "epoch": 0.01, "learning_rate": 6.02365787079163e-06, "loss": 1.8403, "step": 331 }, { "epoch": 0.01, "learning_rate": 6.041856232939036e-06, "loss": 1.8311, "step": 332 }, { "epoch": 0.01, "learning_rate": 6.0600545950864435e-06, "loss": 1.7217, "step": 333 }, { "epoch": 0.01, "learning_rate": 6.07825295723385e-06, "loss": 1.9077, "step": 334 }, { "epoch": 0.01, "learning_rate": 6.0964513193812556e-06, "loss": 2.0752, "step": 335 }, { "epoch": 0.01, "learning_rate": 6.114649681528663e-06, "loss": 1.8271, "step": 336 }, { "epoch": 0.01, "learning_rate": 6.132848043676069e-06, "loss": 1.9731, "step": 337 }, { "epoch": 0.01, "learning_rate": 6.151046405823477e-06, "loss": 1.7852, "step": 338 }, { "epoch": 0.01, "learning_rate": 6.169244767970883e-06, "loss": 1.8818, "step": 339 }, { "epoch": 0.01, "learning_rate": 6.1874431301182905e-06, "loss": 1.9414, "step": 340 }, { "epoch": 0.01, "learning_rate": 6.205641492265697e-06, "loss": 1.7192, "step": 341 }, { "epoch": 0.01, "learning_rate": 6.223839854413103e-06, "loss": 1.9688, "step": 342 }, { "epoch": 0.01, "learning_rate": 6.24203821656051e-06, "loss": 1.7944, "step": 343 }, { "epoch": 0.01, "learning_rate": 6.260236578707916e-06, "loss": 1.9683, "step": 344 }, { "epoch": 0.01, "learning_rate": 6.278434940855324e-06, "loss": 1.6313, "step": 345 }, { "epoch": 0.01, "learning_rate": 6.29663330300273e-06, "loss": 1.834, "step": 346 }, { "epoch": 0.01, "learning_rate": 6.3148316651501375e-06, "loss": 1.8306, "step": 347 }, { "epoch": 0.01, "learning_rate": 6.333030027297544e-06, "loss": 1.9712, "step": 348 }, { "epoch": 0.01, "learning_rate": 6.35122838944495e-06, "loss": 1.707, "step": 349 }, { "epoch": 0.01, "learning_rate": 6.369426751592357e-06, "loss": 1.8384, "step": 350 }, { "epoch": 0.01, "learning_rate": 6.387625113739763e-06, "loss": 2.0405, "step": 351 }, { "epoch": 0.01, "learning_rate": 6.405823475887171e-06, "loss": 1.7153, "step": 352 }, { "epoch": 0.01, "learning_rate": 6.424021838034577e-06, "loss": 1.6797, "step": 353 }, { "epoch": 0.01, "learning_rate": 6.4422202001819845e-06, "loss": 1.5688, "step": 354 }, { "epoch": 0.01, "learning_rate": 6.460418562329391e-06, "loss": 1.9204, "step": 355 }, { "epoch": 0.01, "learning_rate": 6.4786169244767975e-06, "loss": 1.9233, "step": 356 }, { "epoch": 0.01, "learning_rate": 6.496815286624204e-06, "loss": 1.561, "step": 357 }, { "epoch": 0.01, "learning_rate": 6.515013648771611e-06, "loss": 1.8638, "step": 358 }, { "epoch": 0.01, "learning_rate": 6.533212010919018e-06, "loss": 1.8667, "step": 359 }, { "epoch": 0.01, "learning_rate": 6.551410373066425e-06, "loss": 1.7471, "step": 360 }, { "epoch": 0.01, "learning_rate": 6.5696087352138315e-06, "loss": 1.8442, "step": 361 }, { "epoch": 0.01, "learning_rate": 6.587807097361239e-06, "loss": 1.748, "step": 362 }, { "epoch": 0.01, "learning_rate": 6.6060054595086445e-06, "loss": 1.9048, "step": 363 }, { "epoch": 0.01, "learning_rate": 6.624203821656051e-06, "loss": 1.771, "step": 364 }, { "epoch": 0.01, "learning_rate": 6.642402183803458e-06, "loss": 1.8584, "step": 365 }, { "epoch": 0.01, "learning_rate": 6.660600545950865e-06, "loss": 1.7646, "step": 366 }, { "epoch": 0.01, "learning_rate": 6.678798908098272e-06, "loss": 1.9229, "step": 367 }, { "epoch": 0.01, "learning_rate": 6.6969972702456786e-06, "loss": 1.9175, "step": 368 }, { "epoch": 0.01, "learning_rate": 6.715195632393086e-06, "loss": 2.105, "step": 369 }, { "epoch": 0.01, "learning_rate": 6.7333939945404915e-06, "loss": 1.9006, "step": 370 }, { "epoch": 0.01, "learning_rate": 6.751592356687898e-06, "loss": 1.8389, "step": 371 }, { "epoch": 0.01, "learning_rate": 6.769790718835305e-06, "loss": 1.7168, "step": 372 }, { "epoch": 0.01, "learning_rate": 6.787989080982712e-06, "loss": 1.7798, "step": 373 }, { "epoch": 0.01, "learning_rate": 6.806187443130119e-06, "loss": 1.959, "step": 374 }, { "epoch": 0.01, "learning_rate": 6.824385805277526e-06, "loss": 1.7681, "step": 375 }, { "epoch": 0.01, "learning_rate": 6.842584167424933e-06, "loss": 1.7456, "step": 376 }, { "epoch": 0.01, "learning_rate": 6.860782529572339e-06, "loss": 1.7017, "step": 377 }, { "epoch": 0.01, "learning_rate": 6.878980891719745e-06, "loss": 1.8735, "step": 378 }, { "epoch": 0.01, "learning_rate": 6.897179253867152e-06, "loss": 1.853, "step": 379 }, { "epoch": 0.01, "learning_rate": 6.915377616014559e-06, "loss": 1.7344, "step": 380 }, { "epoch": 0.01, "learning_rate": 6.933575978161966e-06, "loss": 1.842, "step": 381 }, { "epoch": 0.01, "learning_rate": 6.951774340309373e-06, "loss": 1.7256, "step": 382 }, { "epoch": 0.01, "learning_rate": 6.96997270245678e-06, "loss": 1.8135, "step": 383 }, { "epoch": 0.01, "learning_rate": 6.988171064604186e-06, "loss": 1.6079, "step": 384 }, { "epoch": 0.01, "learning_rate": 7.006369426751593e-06, "loss": 1.9834, "step": 385 }, { "epoch": 0.01, "learning_rate": 7.024567788898999e-06, "loss": 1.863, "step": 386 }, { "epoch": 0.01, "learning_rate": 7.042766151046407e-06, "loss": 1.895, "step": 387 }, { "epoch": 0.01, "learning_rate": 7.060964513193813e-06, "loss": 1.7983, "step": 388 }, { "epoch": 0.01, "learning_rate": 7.07916287534122e-06, "loss": 1.646, "step": 389 }, { "epoch": 0.01, "learning_rate": 7.097361237488627e-06, "loss": 1.8267, "step": 390 }, { "epoch": 0.01, "learning_rate": 7.1155595996360334e-06, "loss": 1.8325, "step": 391 }, { "epoch": 0.01, "learning_rate": 7.13375796178344e-06, "loss": 1.6475, "step": 392 }, { "epoch": 0.01, "learning_rate": 7.151956323930846e-06, "loss": 1.8799, "step": 393 }, { "epoch": 0.01, "learning_rate": 7.170154686078254e-06, "loss": 1.7417, "step": 394 }, { "epoch": 0.01, "learning_rate": 7.18835304822566e-06, "loss": 1.7725, "step": 395 }, { "epoch": 0.01, "learning_rate": 7.2065514103730675e-06, "loss": 1.8496, "step": 396 }, { "epoch": 0.01, "learning_rate": 7.224749772520474e-06, "loss": 1.8652, "step": 397 }, { "epoch": 0.01, "learning_rate": 7.242948134667881e-06, "loss": 1.9023, "step": 398 }, { "epoch": 0.01, "learning_rate": 7.261146496815287e-06, "loss": 1.8843, "step": 399 }, { "epoch": 0.01, "learning_rate": 7.279344858962693e-06, "loss": 2.0747, "step": 400 }, { "epoch": 0.01, "learning_rate": 7.297543221110101e-06, "loss": 1.8828, "step": 401 }, { "epoch": 0.01, "learning_rate": 7.315741583257507e-06, "loss": 1.832, "step": 402 }, { "epoch": 0.01, "learning_rate": 7.3339399454049145e-06, "loss": 1.8569, "step": 403 }, { "epoch": 0.01, "learning_rate": 7.352138307552321e-06, "loss": 1.834, "step": 404 }, { "epoch": 0.01, "learning_rate": 7.370336669699728e-06, "loss": 1.8691, "step": 405 }, { "epoch": 0.01, "learning_rate": 7.388535031847134e-06, "loss": 1.873, "step": 406 }, { "epoch": 0.01, "learning_rate": 7.40673339399454e-06, "loss": 1.9028, "step": 407 }, { "epoch": 0.01, "learning_rate": 7.424931756141948e-06, "loss": 1.8232, "step": 408 }, { "epoch": 0.01, "learning_rate": 7.443130118289354e-06, "loss": 1.7305, "step": 409 }, { "epoch": 0.01, "learning_rate": 7.4613284804367615e-06, "loss": 1.6816, "step": 410 }, { "epoch": 0.01, "learning_rate": 7.479526842584168e-06, "loss": 1.7866, "step": 411 }, { "epoch": 0.01, "learning_rate": 7.497725204731575e-06, "loss": 1.7798, "step": 412 }, { "epoch": 0.01, "learning_rate": 7.515923566878982e-06, "loss": 1.7065, "step": 413 }, { "epoch": 0.01, "learning_rate": 7.5341219290263874e-06, "loss": 1.7788, "step": 414 }, { "epoch": 0.01, "learning_rate": 7.552320291173795e-06, "loss": 1.8755, "step": 415 }, { "epoch": 0.01, "learning_rate": 7.570518653321201e-06, "loss": 1.7607, "step": 416 }, { "epoch": 0.01, "learning_rate": 7.5887170154686086e-06, "loss": 1.7593, "step": 417 }, { "epoch": 0.01, "learning_rate": 7.606915377616015e-06, "loss": 1.9575, "step": 418 }, { "epoch": 0.01, "learning_rate": 7.625113739763422e-06, "loss": 1.8574, "step": 419 }, { "epoch": 0.01, "learning_rate": 7.64331210191083e-06, "loss": 1.8228, "step": 420 }, { "epoch": 0.01, "learning_rate": 7.661510464058235e-06, "loss": 1.9771, "step": 421 }, { "epoch": 0.01, "learning_rate": 7.679708826205643e-06, "loss": 1.7573, "step": 422 }, { "epoch": 0.01, "learning_rate": 7.697907188353048e-06, "loss": 1.7065, "step": 423 }, { "epoch": 0.01, "learning_rate": 7.716105550500456e-06, "loss": 1.9517, "step": 424 }, { "epoch": 0.01, "learning_rate": 7.734303912647863e-06, "loss": 1.9468, "step": 425 }, { "epoch": 0.01, "learning_rate": 7.75250227479527e-06, "loss": 1.6118, "step": 426 }, { "epoch": 0.01, "learning_rate": 7.770700636942676e-06, "loss": 1.7856, "step": 427 }, { "epoch": 0.01, "learning_rate": 7.788898999090081e-06, "loss": 1.7227, "step": 428 }, { "epoch": 0.01, "learning_rate": 7.807097361237489e-06, "loss": 1.8765, "step": 429 }, { "epoch": 0.01, "learning_rate": 7.825295723384896e-06, "loss": 1.7012, "step": 430 }, { "epoch": 0.01, "learning_rate": 7.843494085532303e-06, "loss": 1.731, "step": 431 }, { "epoch": 0.01, "learning_rate": 7.861692447679709e-06, "loss": 1.8071, "step": 432 }, { "epoch": 0.01, "learning_rate": 7.879890809827116e-06, "loss": 1.6885, "step": 433 }, { "epoch": 0.01, "learning_rate": 7.898089171974524e-06, "loss": 1.8618, "step": 434 }, { "epoch": 0.01, "learning_rate": 7.91628753412193e-06, "loss": 1.792, "step": 435 }, { "epoch": 0.01, "learning_rate": 7.934485896269337e-06, "loss": 1.8379, "step": 436 }, { "epoch": 0.01, "learning_rate": 7.952684258416742e-06, "loss": 1.8203, "step": 437 }, { "epoch": 0.01, "learning_rate": 7.97088262056415e-06, "loss": 1.9448, "step": 438 }, { "epoch": 0.01, "learning_rate": 7.989080982711557e-06, "loss": 1.7285, "step": 439 }, { "epoch": 0.01, "learning_rate": 8.007279344858964e-06, "loss": 1.8008, "step": 440 }, { "epoch": 0.01, "learning_rate": 8.02547770700637e-06, "loss": 1.7832, "step": 441 }, { "epoch": 0.01, "learning_rate": 8.043676069153776e-06, "loss": 1.8389, "step": 442 }, { "epoch": 0.01, "learning_rate": 8.061874431301183e-06, "loss": 1.7368, "step": 443 }, { "epoch": 0.01, "learning_rate": 8.08007279344859e-06, "loss": 1.7358, "step": 444 }, { "epoch": 0.01, "learning_rate": 8.098271155595997e-06, "loss": 1.5437, "step": 445 }, { "epoch": 0.01, "learning_rate": 8.116469517743403e-06, "loss": 1.853, "step": 446 }, { "epoch": 0.01, "learning_rate": 8.13466787989081e-06, "loss": 1.8628, "step": 447 }, { "epoch": 0.01, "learning_rate": 8.152866242038218e-06, "loss": 1.8608, "step": 448 }, { "epoch": 0.01, "learning_rate": 8.171064604185623e-06, "loss": 1.8506, "step": 449 }, { "epoch": 0.01, "learning_rate": 8.18926296633303e-06, "loss": 1.7979, "step": 450 }, { "epoch": 0.01, "learning_rate": 8.207461328480438e-06, "loss": 2.0093, "step": 451 }, { "epoch": 0.01, "learning_rate": 8.225659690627844e-06, "loss": 1.7671, "step": 452 }, { "epoch": 0.01, "learning_rate": 8.243858052775251e-06, "loss": 1.7808, "step": 453 }, { "epoch": 0.01, "learning_rate": 8.262056414922658e-06, "loss": 1.9033, "step": 454 }, { "epoch": 0.01, "learning_rate": 8.280254777070064e-06, "loss": 1.6846, "step": 455 }, { "epoch": 0.01, "learning_rate": 8.298453139217471e-06, "loss": 1.9067, "step": 456 }, { "epoch": 0.01, "learning_rate": 8.316651501364877e-06, "loss": 1.7822, "step": 457 }, { "epoch": 0.01, "learning_rate": 8.334849863512284e-06, "loss": 1.9619, "step": 458 }, { "epoch": 0.01, "learning_rate": 8.353048225659692e-06, "loss": 1.7837, "step": 459 }, { "epoch": 0.01, "learning_rate": 8.371246587807099e-06, "loss": 1.7632, "step": 460 }, { "epoch": 0.01, "learning_rate": 8.389444949954504e-06, "loss": 1.7095, "step": 461 }, { "epoch": 0.01, "learning_rate": 8.407643312101912e-06, "loss": 1.73, "step": 462 }, { "epoch": 0.01, "learning_rate": 8.425841674249319e-06, "loss": 1.688, "step": 463 }, { "epoch": 0.01, "learning_rate": 8.444040036396725e-06, "loss": 1.5991, "step": 464 }, { "epoch": 0.01, "learning_rate": 8.462238398544132e-06, "loss": 1.7129, "step": 465 }, { "epoch": 0.01, "learning_rate": 8.480436760691538e-06, "loss": 1.7847, "step": 466 }, { "epoch": 0.01, "learning_rate": 8.498635122838945e-06, "loss": 1.6689, "step": 467 }, { "epoch": 0.01, "learning_rate": 8.516833484986352e-06, "loss": 1.7058, "step": 468 }, { "epoch": 0.01, "learning_rate": 8.53503184713376e-06, "loss": 1.6611, "step": 469 }, { "epoch": 0.01, "learning_rate": 8.553230209281165e-06, "loss": 1.894, "step": 470 }, { "epoch": 0.01, "learning_rate": 8.571428571428571e-06, "loss": 1.782, "step": 471 }, { "epoch": 0.01, "learning_rate": 8.589626933575978e-06, "loss": 1.8467, "step": 472 }, { "epoch": 0.01, "learning_rate": 8.607825295723386e-06, "loss": 1.6392, "step": 473 }, { "epoch": 0.01, "learning_rate": 8.626023657870793e-06, "loss": 1.7671, "step": 474 }, { "epoch": 0.01, "learning_rate": 8.644222020018199e-06, "loss": 1.6821, "step": 475 }, { "epoch": 0.01, "learning_rate": 8.662420382165606e-06, "loss": 1.7754, "step": 476 }, { "epoch": 0.01, "learning_rate": 8.680618744313013e-06, "loss": 1.9233, "step": 477 }, { "epoch": 0.01, "learning_rate": 8.698817106460419e-06, "loss": 1.9429, "step": 478 }, { "epoch": 0.01, "learning_rate": 8.717015468607826e-06, "loss": 1.8418, "step": 479 }, { "epoch": 0.01, "learning_rate": 8.735213830755232e-06, "loss": 1.8149, "step": 480 }, { "epoch": 0.01, "learning_rate": 8.753412192902639e-06, "loss": 1.8628, "step": 481 }, { "epoch": 0.01, "learning_rate": 8.771610555050046e-06, "loss": 1.8291, "step": 482 }, { "epoch": 0.01, "learning_rate": 8.789808917197454e-06, "loss": 1.666, "step": 483 }, { "epoch": 0.01, "learning_rate": 8.80800727934486e-06, "loss": 1.7549, "step": 484 }, { "epoch": 0.01, "learning_rate": 8.826205641492267e-06, "loss": 1.8843, "step": 485 }, { "epoch": 0.01, "learning_rate": 8.844404003639672e-06, "loss": 1.731, "step": 486 }, { "epoch": 0.01, "learning_rate": 8.86260236578708e-06, "loss": 1.7988, "step": 487 }, { "epoch": 0.01, "learning_rate": 8.880800727934487e-06, "loss": 2.0234, "step": 488 }, { "epoch": 0.01, "learning_rate": 8.898999090081894e-06, "loss": 1.7104, "step": 489 }, { "epoch": 0.01, "learning_rate": 8.9171974522293e-06, "loss": 1.9253, "step": 490 }, { "epoch": 0.01, "learning_rate": 8.935395814376707e-06, "loss": 1.834, "step": 491 }, { "epoch": 0.01, "learning_rate": 8.953594176524115e-06, "loss": 1.8555, "step": 492 }, { "epoch": 0.01, "learning_rate": 8.97179253867152e-06, "loss": 1.834, "step": 493 }, { "epoch": 0.01, "learning_rate": 8.989990900818927e-06, "loss": 1.5979, "step": 494 }, { "epoch": 0.01, "learning_rate": 9.008189262966333e-06, "loss": 1.8003, "step": 495 }, { "epoch": 0.01, "learning_rate": 9.02638762511374e-06, "loss": 1.8799, "step": 496 }, { "epoch": 0.01, "learning_rate": 9.044585987261148e-06, "loss": 1.6743, "step": 497 }, { "epoch": 0.01, "learning_rate": 9.062784349408555e-06, "loss": 1.8101, "step": 498 }, { "epoch": 0.01, "learning_rate": 9.08098271155596e-06, "loss": 1.7471, "step": 499 }, { "epoch": 0.01, "learning_rate": 9.099181073703366e-06, "loss": 1.8589, "step": 500 }, { "epoch": 0.01, "learning_rate": 9.117379435850774e-06, "loss": 1.8262, "step": 501 }, { "epoch": 0.01, "learning_rate": 9.135577797998181e-06, "loss": 1.936, "step": 502 }, { "epoch": 0.01, "learning_rate": 9.153776160145588e-06, "loss": 1.7832, "step": 503 }, { "epoch": 0.01, "learning_rate": 9.171974522292994e-06, "loss": 1.8022, "step": 504 }, { "epoch": 0.01, "learning_rate": 9.190172884440401e-06, "loss": 1.6743, "step": 505 }, { "epoch": 0.01, "learning_rate": 9.208371246587809e-06, "loss": 1.7051, "step": 506 }, { "epoch": 0.01, "learning_rate": 9.226569608735214e-06, "loss": 1.8179, "step": 507 }, { "epoch": 0.01, "learning_rate": 9.244767970882622e-06, "loss": 1.7881, "step": 508 }, { "epoch": 0.01, "learning_rate": 9.262966333030027e-06, "loss": 1.6152, "step": 509 }, { "epoch": 0.01, "learning_rate": 9.281164695177434e-06, "loss": 1.6978, "step": 510 }, { "epoch": 0.01, "learning_rate": 9.299363057324842e-06, "loss": 1.6904, "step": 511 }, { "epoch": 0.01, "learning_rate": 9.317561419472249e-06, "loss": 1.8286, "step": 512 }, { "epoch": 0.01, "learning_rate": 9.335759781619655e-06, "loss": 1.855, "step": 513 }, { "epoch": 0.01, "learning_rate": 9.353958143767062e-06, "loss": 1.5188, "step": 514 }, { "epoch": 0.01, "learning_rate": 9.372156505914468e-06, "loss": 1.7671, "step": 515 }, { "epoch": 0.01, "learning_rate": 9.390354868061875e-06, "loss": 1.748, "step": 516 }, { "epoch": 0.01, "learning_rate": 9.408553230209282e-06, "loss": 1.5769, "step": 517 }, { "epoch": 0.01, "learning_rate": 9.426751592356688e-06, "loss": 1.9067, "step": 518 }, { "epoch": 0.01, "learning_rate": 9.444949954504095e-06, "loss": 2.0137, "step": 519 }, { "epoch": 0.01, "learning_rate": 9.463148316651503e-06, "loss": 1.6714, "step": 520 }, { "epoch": 0.01, "learning_rate": 9.481346678798908e-06, "loss": 1.4714, "step": 521 }, { "epoch": 0.01, "learning_rate": 9.499545040946316e-06, "loss": 1.6921, "step": 522 }, { "epoch": 0.01, "learning_rate": 9.517743403093723e-06, "loss": 1.9556, "step": 523 }, { "epoch": 0.01, "learning_rate": 9.535941765241129e-06, "loss": 1.8481, "step": 524 }, { "epoch": 0.01, "learning_rate": 9.554140127388536e-06, "loss": 1.8521, "step": 525 }, { "epoch": 0.01, "learning_rate": 9.572338489535943e-06, "loss": 1.8384, "step": 526 }, { "epoch": 0.01, "learning_rate": 9.59053685168335e-06, "loss": 1.9214, "step": 527 }, { "epoch": 0.01, "learning_rate": 9.608735213830756e-06, "loss": 1.8147, "step": 528 }, { "epoch": 0.01, "learning_rate": 9.626933575978162e-06, "loss": 1.7168, "step": 529 }, { "epoch": 0.01, "learning_rate": 9.645131938125569e-06, "loss": 1.7456, "step": 530 }, { "epoch": 0.01, "learning_rate": 9.663330300272976e-06, "loss": 1.7905, "step": 531 }, { "epoch": 0.01, "learning_rate": 9.681528662420384e-06, "loss": 1.9629, "step": 532 }, { "epoch": 0.01, "learning_rate": 9.69972702456779e-06, "loss": 1.6213, "step": 533 }, { "epoch": 0.01, "learning_rate": 9.717925386715197e-06, "loss": 1.71, "step": 534 }, { "epoch": 0.01, "learning_rate": 9.736123748862604e-06, "loss": 1.7407, "step": 535 }, { "epoch": 0.01, "learning_rate": 9.75432211101001e-06, "loss": 1.7222, "step": 536 }, { "epoch": 0.01, "learning_rate": 9.772520473157417e-06, "loss": 1.7271, "step": 537 }, { "epoch": 0.01, "learning_rate": 9.790718835304823e-06, "loss": 1.7676, "step": 538 }, { "epoch": 0.01, "learning_rate": 9.80891719745223e-06, "loss": 1.6865, "step": 539 }, { "epoch": 0.01, "learning_rate": 9.827115559599637e-06, "loss": 1.8818, "step": 540 }, { "epoch": 0.01, "learning_rate": 9.845313921747045e-06, "loss": 1.6631, "step": 541 }, { "epoch": 0.01, "learning_rate": 9.86351228389445e-06, "loss": 1.8462, "step": 542 }, { "epoch": 0.01, "learning_rate": 9.881710646041856e-06, "loss": 1.8965, "step": 543 }, { "epoch": 0.01, "learning_rate": 9.899909008189263e-06, "loss": 1.8352, "step": 544 }, { "epoch": 0.01, "learning_rate": 9.91810737033667e-06, "loss": 1.6826, "step": 545 }, { "epoch": 0.01, "learning_rate": 9.936305732484078e-06, "loss": 1.7886, "step": 546 }, { "epoch": 0.01, "learning_rate": 9.954504094631483e-06, "loss": 1.7061, "step": 547 }, { "epoch": 0.01, "learning_rate": 9.97270245677889e-06, "loss": 1.833, "step": 548 }, { "epoch": 0.01, "learning_rate": 9.990900818926298e-06, "loss": 1.814, "step": 549 }, { "epoch": 0.02, "learning_rate": 1.0009099181073705e-05, "loss": 1.9102, "step": 550 }, { "epoch": 0.02, "learning_rate": 1.0027297543221111e-05, "loss": 1.7471, "step": 551 }, { "epoch": 0.02, "learning_rate": 1.0045495905368518e-05, "loss": 1.6963, "step": 552 }, { "epoch": 0.02, "learning_rate": 1.0063694267515924e-05, "loss": 1.9468, "step": 553 }, { "epoch": 0.02, "learning_rate": 1.008189262966333e-05, "loss": 1.7192, "step": 554 }, { "epoch": 0.02, "learning_rate": 1.0100090991810739e-05, "loss": 1.4895, "step": 555 }, { "epoch": 0.02, "learning_rate": 1.0118289353958144e-05, "loss": 1.7742, "step": 556 }, { "epoch": 0.02, "learning_rate": 1.0136487716105551e-05, "loss": 1.6665, "step": 557 }, { "epoch": 0.02, "learning_rate": 1.0154686078252957e-05, "loss": 1.7837, "step": 558 }, { "epoch": 0.02, "learning_rate": 1.0172884440400366e-05, "loss": 1.6958, "step": 559 }, { "epoch": 0.02, "learning_rate": 1.0191082802547772e-05, "loss": 1.7148, "step": 560 }, { "epoch": 0.02, "learning_rate": 1.0209281164695177e-05, "loss": 1.7664, "step": 561 }, { "epoch": 0.02, "learning_rate": 1.0227479526842585e-05, "loss": 1.7412, "step": 562 }, { "epoch": 0.02, "learning_rate": 1.024567788898999e-05, "loss": 1.8052, "step": 563 }, { "epoch": 0.02, "learning_rate": 1.02638762511374e-05, "loss": 1.7461, "step": 564 }, { "epoch": 0.02, "learning_rate": 1.0282074613284805e-05, "loss": 1.6333, "step": 565 }, { "epoch": 0.02, "learning_rate": 1.0300272975432212e-05, "loss": 1.7515, "step": 566 }, { "epoch": 0.02, "learning_rate": 1.0318471337579618e-05, "loss": 1.6606, "step": 567 }, { "epoch": 0.02, "learning_rate": 1.0336669699727024e-05, "loss": 1.7114, "step": 568 }, { "epoch": 0.02, "learning_rate": 1.0354868061874433e-05, "loss": 1.7388, "step": 569 }, { "epoch": 0.02, "learning_rate": 1.0373066424021838e-05, "loss": 1.8647, "step": 570 }, { "epoch": 0.02, "learning_rate": 1.0391264786169246e-05, "loss": 1.5376, "step": 571 }, { "epoch": 0.02, "learning_rate": 1.0409463148316651e-05, "loss": 1.8213, "step": 572 }, { "epoch": 0.02, "learning_rate": 1.042766151046406e-05, "loss": 1.7754, "step": 573 }, { "epoch": 0.02, "learning_rate": 1.0445859872611466e-05, "loss": 1.8574, "step": 574 }, { "epoch": 0.02, "learning_rate": 1.0464058234758871e-05, "loss": 1.623, "step": 575 }, { "epoch": 0.02, "learning_rate": 1.0482256596906279e-05, "loss": 1.7129, "step": 576 }, { "epoch": 0.02, "learning_rate": 1.0500454959053686e-05, "loss": 1.875, "step": 577 }, { "epoch": 0.02, "learning_rate": 1.0518653321201093e-05, "loss": 1.6235, "step": 578 }, { "epoch": 0.02, "learning_rate": 1.0536851683348499e-05, "loss": 1.7051, "step": 579 }, { "epoch": 0.02, "learning_rate": 1.0555050045495906e-05, "loss": 1.5825, "step": 580 }, { "epoch": 0.02, "learning_rate": 1.0573248407643314e-05, "loss": 1.7097, "step": 581 }, { "epoch": 0.02, "learning_rate": 1.059144676979072e-05, "loss": 1.7388, "step": 582 }, { "epoch": 0.02, "learning_rate": 1.0609645131938127e-05, "loss": 1.7056, "step": 583 }, { "epoch": 0.02, "learning_rate": 1.0627843494085532e-05, "loss": 1.8604, "step": 584 }, { "epoch": 0.02, "learning_rate": 1.064604185623294e-05, "loss": 1.7258, "step": 585 }, { "epoch": 0.02, "learning_rate": 1.0664240218380347e-05, "loss": 1.7637, "step": 586 }, { "epoch": 0.02, "learning_rate": 1.0682438580527754e-05, "loss": 1.5864, "step": 587 }, { "epoch": 0.02, "learning_rate": 1.070063694267516e-05, "loss": 1.7246, "step": 588 }, { "epoch": 0.02, "learning_rate": 1.0718835304822567e-05, "loss": 1.6831, "step": 589 }, { "epoch": 0.02, "learning_rate": 1.0737033666969974e-05, "loss": 1.8955, "step": 590 }, { "epoch": 0.02, "learning_rate": 1.075523202911738e-05, "loss": 1.6904, "step": 591 }, { "epoch": 0.02, "learning_rate": 1.0773430391264787e-05, "loss": 1.6011, "step": 592 }, { "epoch": 0.02, "learning_rate": 1.0791628753412193e-05, "loss": 1.7402, "step": 593 }, { "epoch": 0.02, "learning_rate": 1.0809827115559602e-05, "loss": 1.8286, "step": 594 }, { "epoch": 0.02, "learning_rate": 1.0828025477707008e-05, "loss": 1.7305, "step": 595 }, { "epoch": 0.02, "learning_rate": 1.0846223839854415e-05, "loss": 1.8359, "step": 596 }, { "epoch": 0.02, "learning_rate": 1.086442220200182e-05, "loss": 1.8008, "step": 597 }, { "epoch": 0.02, "learning_rate": 1.0882620564149226e-05, "loss": 1.856, "step": 598 }, { "epoch": 0.02, "learning_rate": 1.0900818926296635e-05, "loss": 1.7168, "step": 599 }, { "epoch": 0.02, "learning_rate": 1.0919017288444041e-05, "loss": 1.7964, "step": 600 }, { "epoch": 0.02, "learning_rate": 1.0937215650591448e-05, "loss": 1.6929, "step": 601 }, { "epoch": 0.02, "learning_rate": 1.0955414012738854e-05, "loss": 1.7041, "step": 602 }, { "epoch": 0.02, "learning_rate": 1.0973612374886263e-05, "loss": 1.8203, "step": 603 }, { "epoch": 0.02, "learning_rate": 1.0991810737033669e-05, "loss": 1.6255, "step": 604 }, { "epoch": 0.02, "learning_rate": 1.1010009099181074e-05, "loss": 1.853, "step": 605 }, { "epoch": 0.02, "learning_rate": 1.1028207461328481e-05, "loss": 1.8892, "step": 606 }, { "epoch": 0.02, "learning_rate": 1.1046405823475887e-05, "loss": 1.7031, "step": 607 }, { "epoch": 0.02, "learning_rate": 1.1064604185623296e-05, "loss": 1.6162, "step": 608 }, { "epoch": 0.02, "learning_rate": 1.1082802547770702e-05, "loss": 1.7031, "step": 609 }, { "epoch": 0.02, "learning_rate": 1.1101000909918109e-05, "loss": 1.6489, "step": 610 }, { "epoch": 0.02, "learning_rate": 1.1119199272065515e-05, "loss": 1.751, "step": 611 }, { "epoch": 0.02, "learning_rate": 1.113739763421292e-05, "loss": 1.6062, "step": 612 }, { "epoch": 0.02, "learning_rate": 1.115559599636033e-05, "loss": 1.832, "step": 613 }, { "epoch": 0.02, "learning_rate": 1.1173794358507735e-05, "loss": 1.6895, "step": 614 }, { "epoch": 0.02, "learning_rate": 1.1191992720655142e-05, "loss": 1.665, "step": 615 }, { "epoch": 0.02, "learning_rate": 1.1210191082802548e-05, "loss": 1.708, "step": 616 }, { "epoch": 0.02, "learning_rate": 1.1228389444949957e-05, "loss": 1.6782, "step": 617 }, { "epoch": 0.02, "learning_rate": 1.1246587807097363e-05, "loss": 1.7412, "step": 618 }, { "epoch": 0.02, "learning_rate": 1.1264786169244768e-05, "loss": 1.8276, "step": 619 }, { "epoch": 0.02, "learning_rate": 1.1282984531392176e-05, "loss": 1.6145, "step": 620 }, { "epoch": 0.02, "learning_rate": 1.1301182893539581e-05, "loss": 1.6494, "step": 621 }, { "epoch": 0.02, "learning_rate": 1.131938125568699e-05, "loss": 1.6948, "step": 622 }, { "epoch": 0.02, "learning_rate": 1.1337579617834396e-05, "loss": 1.554, "step": 623 }, { "epoch": 0.02, "learning_rate": 1.1355777979981803e-05, "loss": 1.7192, "step": 624 }, { "epoch": 0.02, "learning_rate": 1.1373976342129209e-05, "loss": 1.7358, "step": 625 }, { "epoch": 0.02, "learning_rate": 1.1392174704276614e-05, "loss": 1.7959, "step": 626 }, { "epoch": 0.02, "learning_rate": 1.1410373066424023e-05, "loss": 1.7437, "step": 627 }, { "epoch": 0.02, "learning_rate": 1.1428571428571429e-05, "loss": 1.7363, "step": 628 }, { "epoch": 0.02, "learning_rate": 1.1446769790718836e-05, "loss": 1.8486, "step": 629 }, { "epoch": 0.02, "learning_rate": 1.1464968152866242e-05, "loss": 1.6592, "step": 630 }, { "epoch": 0.02, "learning_rate": 1.1483166515013651e-05, "loss": 1.8506, "step": 631 }, { "epoch": 0.02, "learning_rate": 1.1501364877161057e-05, "loss": 1.7295, "step": 632 }, { "epoch": 0.02, "learning_rate": 1.1519563239308462e-05, "loss": 1.752, "step": 633 }, { "epoch": 0.02, "learning_rate": 1.153776160145587e-05, "loss": 1.7578, "step": 634 }, { "epoch": 0.02, "learning_rate": 1.1555959963603275e-05, "loss": 1.5137, "step": 635 }, { "epoch": 0.02, "learning_rate": 1.1574158325750684e-05, "loss": 1.7734, "step": 636 }, { "epoch": 0.02, "learning_rate": 1.159235668789809e-05, "loss": 1.7744, "step": 637 }, { "epoch": 0.02, "learning_rate": 1.1610555050045497e-05, "loss": 1.6162, "step": 638 }, { "epoch": 0.02, "learning_rate": 1.1628753412192903e-05, "loss": 1.6572, "step": 639 }, { "epoch": 0.02, "learning_rate": 1.164695177434031e-05, "loss": 1.6416, "step": 640 }, { "epoch": 0.02, "learning_rate": 1.1665150136487717e-05, "loss": 1.7671, "step": 641 }, { "epoch": 0.02, "learning_rate": 1.1683348498635123e-05, "loss": 1.7041, "step": 642 }, { "epoch": 0.02, "learning_rate": 1.170154686078253e-05, "loss": 1.604, "step": 643 }, { "epoch": 0.02, "learning_rate": 1.1719745222929938e-05, "loss": 1.7427, "step": 644 }, { "epoch": 0.02, "learning_rate": 1.1737943585077345e-05, "loss": 1.6924, "step": 645 }, { "epoch": 0.02, "learning_rate": 1.175614194722475e-05, "loss": 2.0034, "step": 646 }, { "epoch": 0.02, "learning_rate": 1.1774340309372156e-05, "loss": 1.6909, "step": 647 }, { "epoch": 0.02, "learning_rate": 1.1792538671519564e-05, "loss": 1.8018, "step": 648 }, { "epoch": 0.02, "learning_rate": 1.1810737033666971e-05, "loss": 1.8428, "step": 649 }, { "epoch": 0.02, "learning_rate": 1.1828935395814378e-05, "loss": 1.8306, "step": 650 }, { "epoch": 0.02, "learning_rate": 1.1847133757961784e-05, "loss": 1.8848, "step": 651 }, { "epoch": 0.02, "learning_rate": 1.1865332120109191e-05, "loss": 1.5693, "step": 652 }, { "epoch": 0.02, "learning_rate": 1.1883530482256599e-05, "loss": 1.7695, "step": 653 }, { "epoch": 0.02, "learning_rate": 1.1901728844404004e-05, "loss": 1.8486, "step": 654 }, { "epoch": 0.02, "learning_rate": 1.1919927206551411e-05, "loss": 1.7178, "step": 655 }, { "epoch": 0.02, "learning_rate": 1.1938125568698817e-05, "loss": 1.7881, "step": 656 }, { "epoch": 0.02, "learning_rate": 1.1956323930846226e-05, "loss": 1.707, "step": 657 }, { "epoch": 0.02, "learning_rate": 1.1974522292993632e-05, "loss": 1.5686, "step": 658 }, { "epoch": 0.02, "learning_rate": 1.1992720655141039e-05, "loss": 1.7446, "step": 659 }, { "epoch": 0.02, "learning_rate": 1.2010919017288445e-05, "loss": 1.6201, "step": 660 }, { "epoch": 0.02, "learning_rate": 1.202911737943585e-05, "loss": 1.6938, "step": 661 }, { "epoch": 0.02, "learning_rate": 1.204731574158326e-05, "loss": 1.4912, "step": 662 }, { "epoch": 0.02, "learning_rate": 1.2065514103730665e-05, "loss": 1.7324, "step": 663 }, { "epoch": 0.02, "learning_rate": 1.2083712465878072e-05, "loss": 1.6958, "step": 664 }, { "epoch": 0.02, "learning_rate": 1.2101910828025478e-05, "loss": 1.814, "step": 665 }, { "epoch": 0.02, "learning_rate": 1.2120109190172887e-05, "loss": 1.7954, "step": 666 }, { "epoch": 0.02, "learning_rate": 1.2138307552320293e-05, "loss": 1.6733, "step": 667 }, { "epoch": 0.02, "learning_rate": 1.21565059144677e-05, "loss": 1.9956, "step": 668 }, { "epoch": 0.02, "learning_rate": 1.2174704276615106e-05, "loss": 1.6987, "step": 669 }, { "epoch": 0.02, "learning_rate": 1.2192902638762511e-05, "loss": 1.7983, "step": 670 }, { "epoch": 0.02, "learning_rate": 1.221110100090992e-05, "loss": 1.6509, "step": 671 }, { "epoch": 0.02, "learning_rate": 1.2229299363057326e-05, "loss": 1.6543, "step": 672 }, { "epoch": 0.02, "learning_rate": 1.2247497725204733e-05, "loss": 1.6162, "step": 673 }, { "epoch": 0.02, "learning_rate": 1.2265696087352139e-05, "loss": 1.7314, "step": 674 }, { "epoch": 0.02, "learning_rate": 1.2283894449499548e-05, "loss": 1.6765, "step": 675 }, { "epoch": 0.02, "learning_rate": 1.2302092811646953e-05, "loss": 1.7549, "step": 676 }, { "epoch": 0.02, "learning_rate": 1.2320291173794359e-05, "loss": 1.6445, "step": 677 }, { "epoch": 0.02, "learning_rate": 1.2338489535941766e-05, "loss": 1.7578, "step": 678 }, { "epoch": 0.02, "learning_rate": 1.2356687898089172e-05, "loss": 1.6423, "step": 679 }, { "epoch": 0.02, "learning_rate": 1.2374886260236581e-05, "loss": 1.6543, "step": 680 }, { "epoch": 0.02, "learning_rate": 1.2393084622383987e-05, "loss": 1.7368, "step": 681 }, { "epoch": 0.02, "learning_rate": 1.2411282984531394e-05, "loss": 1.7148, "step": 682 }, { "epoch": 0.02, "learning_rate": 1.24294813466788e-05, "loss": 1.6567, "step": 683 }, { "epoch": 0.02, "learning_rate": 1.2447679708826205e-05, "loss": 1.6782, "step": 684 }, { "epoch": 0.02, "learning_rate": 1.2465878070973614e-05, "loss": 1.7451, "step": 685 }, { "epoch": 0.02, "learning_rate": 1.248407643312102e-05, "loss": 1.7974, "step": 686 }, { "epoch": 0.02, "learning_rate": 1.2502274795268427e-05, "loss": 1.4609, "step": 687 }, { "epoch": 0.02, "learning_rate": 1.2520473157415833e-05, "loss": 1.7168, "step": 688 }, { "epoch": 0.02, "learning_rate": 1.2538671519563242e-05, "loss": 1.6641, "step": 689 }, { "epoch": 0.02, "learning_rate": 1.2556869881710647e-05, "loss": 1.7764, "step": 690 }, { "epoch": 0.02, "learning_rate": 1.2575068243858053e-05, "loss": 1.6611, "step": 691 }, { "epoch": 0.02, "learning_rate": 1.259326660600546e-05, "loss": 1.6455, "step": 692 }, { "epoch": 0.02, "learning_rate": 1.2611464968152866e-05, "loss": 1.7139, "step": 693 }, { "epoch": 0.02, "learning_rate": 1.2629663330300275e-05, "loss": 1.7949, "step": 694 }, { "epoch": 0.02, "learning_rate": 1.264786169244768e-05, "loss": 1.6826, "step": 695 }, { "epoch": 0.02, "learning_rate": 1.2666060054595088e-05, "loss": 1.8276, "step": 696 }, { "epoch": 0.02, "learning_rate": 1.2684258416742494e-05, "loss": 1.5293, "step": 697 }, { "epoch": 0.02, "learning_rate": 1.27024567788899e-05, "loss": 1.7456, "step": 698 }, { "epoch": 0.02, "learning_rate": 1.2720655141037308e-05, "loss": 1.6978, "step": 699 }, { "epoch": 0.02, "learning_rate": 1.2738853503184714e-05, "loss": 1.7607, "step": 700 }, { "epoch": 0.02, "learning_rate": 1.2757051865332121e-05, "loss": 1.7344, "step": 701 }, { "epoch": 0.02, "learning_rate": 1.2775250227479527e-05, "loss": 1.6057, "step": 702 }, { "epoch": 0.02, "learning_rate": 1.2793448589626936e-05, "loss": 1.7578, "step": 703 }, { "epoch": 0.02, "learning_rate": 1.2811646951774341e-05, "loss": 1.7251, "step": 704 }, { "epoch": 0.02, "learning_rate": 1.2829845313921747e-05, "loss": 1.7676, "step": 705 }, { "epoch": 0.02, "learning_rate": 1.2848043676069154e-05, "loss": 1.6575, "step": 706 }, { "epoch": 0.02, "learning_rate": 1.2866242038216562e-05, "loss": 1.7314, "step": 707 }, { "epoch": 0.02, "learning_rate": 1.2884440400363969e-05, "loss": 1.7231, "step": 708 }, { "epoch": 0.02, "learning_rate": 1.2902638762511375e-05, "loss": 1.7559, "step": 709 }, { "epoch": 0.02, "learning_rate": 1.2920837124658782e-05, "loss": 1.7583, "step": 710 }, { "epoch": 0.02, "learning_rate": 1.293903548680619e-05, "loss": 1.5176, "step": 711 }, { "epoch": 0.02, "learning_rate": 1.2957233848953595e-05, "loss": 1.7109, "step": 712 }, { "epoch": 0.02, "learning_rate": 1.2975432211101002e-05, "loss": 1.6396, "step": 713 }, { "epoch": 0.02, "learning_rate": 1.2993630573248408e-05, "loss": 1.6394, "step": 714 }, { "epoch": 0.02, "learning_rate": 1.3011828935395815e-05, "loss": 1.5171, "step": 715 }, { "epoch": 0.02, "learning_rate": 1.3030027297543223e-05, "loss": 1.5908, "step": 716 }, { "epoch": 0.02, "learning_rate": 1.304822565969063e-05, "loss": 1.6733, "step": 717 }, { "epoch": 0.02, "learning_rate": 1.3066424021838036e-05, "loss": 1.7534, "step": 718 }, { "epoch": 0.02, "learning_rate": 1.3084622383985441e-05, "loss": 1.8389, "step": 719 }, { "epoch": 0.02, "learning_rate": 1.310282074613285e-05, "loss": 1.7925, "step": 720 }, { "epoch": 0.02, "learning_rate": 1.3121019108280256e-05, "loss": 1.7427, "step": 721 }, { "epoch": 0.02, "learning_rate": 1.3139217470427663e-05, "loss": 1.5298, "step": 722 }, { "epoch": 0.02, "learning_rate": 1.3157415832575069e-05, "loss": 1.7896, "step": 723 }, { "epoch": 0.02, "learning_rate": 1.3175614194722478e-05, "loss": 2.0142, "step": 724 }, { "epoch": 0.02, "learning_rate": 1.3193812556869883e-05, "loss": 1.7798, "step": 725 }, { "epoch": 0.02, "learning_rate": 1.3212010919017289e-05, "loss": 1.7603, "step": 726 }, { "epoch": 0.02, "learning_rate": 1.3230209281164696e-05, "loss": 1.6855, "step": 727 }, { "epoch": 0.02, "learning_rate": 1.3248407643312102e-05, "loss": 1.6753, "step": 728 }, { "epoch": 0.02, "learning_rate": 1.3266606005459511e-05, "loss": 1.5732, "step": 729 }, { "epoch": 0.02, "learning_rate": 1.3284804367606917e-05, "loss": 1.5698, "step": 730 }, { "epoch": 0.02, "learning_rate": 1.3303002729754324e-05, "loss": 1.8325, "step": 731 }, { "epoch": 0.02, "learning_rate": 1.332120109190173e-05, "loss": 1.5303, "step": 732 }, { "epoch": 0.02, "learning_rate": 1.3339399454049135e-05, "loss": 1.8164, "step": 733 }, { "epoch": 0.02, "learning_rate": 1.3357597816196544e-05, "loss": 1.7466, "step": 734 }, { "epoch": 0.02, "learning_rate": 1.337579617834395e-05, "loss": 1.731, "step": 735 }, { "epoch": 0.02, "learning_rate": 1.3393994540491357e-05, "loss": 1.614, "step": 736 }, { "epoch": 0.02, "learning_rate": 1.3412192902638763e-05, "loss": 1.5947, "step": 737 }, { "epoch": 0.02, "learning_rate": 1.3430391264786172e-05, "loss": 1.8369, "step": 738 }, { "epoch": 0.02, "learning_rate": 1.3448589626933577e-05, "loss": 1.8164, "step": 739 }, { "epoch": 0.02, "learning_rate": 1.3466787989080983e-05, "loss": 1.7983, "step": 740 }, { "epoch": 0.02, "learning_rate": 1.348498635122839e-05, "loss": 1.6396, "step": 741 }, { "epoch": 0.02, "learning_rate": 1.3503184713375796e-05, "loss": 1.7295, "step": 742 }, { "epoch": 0.02, "learning_rate": 1.3521383075523205e-05, "loss": 1.6763, "step": 743 }, { "epoch": 0.02, "learning_rate": 1.353958143767061e-05, "loss": 1.8022, "step": 744 }, { "epoch": 0.02, "learning_rate": 1.3557779799818018e-05, "loss": 1.7793, "step": 745 }, { "epoch": 0.02, "learning_rate": 1.3575978161965424e-05, "loss": 1.6631, "step": 746 }, { "epoch": 0.02, "learning_rate": 1.3594176524112833e-05, "loss": 1.5811, "step": 747 }, { "epoch": 0.02, "learning_rate": 1.3612374886260238e-05, "loss": 1.8394, "step": 748 }, { "epoch": 0.02, "learning_rate": 1.3630573248407644e-05, "loss": 1.6646, "step": 749 }, { "epoch": 0.02, "learning_rate": 1.3648771610555051e-05, "loss": 1.6851, "step": 750 }, { "epoch": 0.02, "learning_rate": 1.3666969972702457e-05, "loss": 1.6287, "step": 751 }, { "epoch": 0.02, "learning_rate": 1.3685168334849866e-05, "loss": 1.707, "step": 752 }, { "epoch": 0.02, "learning_rate": 1.3703366696997271e-05, "loss": 1.8408, "step": 753 }, { "epoch": 0.02, "learning_rate": 1.3721565059144679e-05, "loss": 1.6772, "step": 754 }, { "epoch": 0.02, "learning_rate": 1.3739763421292084e-05, "loss": 1.7188, "step": 755 }, { "epoch": 0.02, "learning_rate": 1.375796178343949e-05, "loss": 1.6865, "step": 756 }, { "epoch": 0.02, "learning_rate": 1.3776160145586899e-05, "loss": 1.5088, "step": 757 }, { "epoch": 0.02, "learning_rate": 1.3794358507734305e-05, "loss": 1.7007, "step": 758 }, { "epoch": 0.02, "learning_rate": 1.3812556869881712e-05, "loss": 1.6211, "step": 759 }, { "epoch": 0.02, "learning_rate": 1.3830755232029118e-05, "loss": 1.8335, "step": 760 }, { "epoch": 0.02, "learning_rate": 1.3848953594176527e-05, "loss": 1.7915, "step": 761 }, { "epoch": 0.02, "learning_rate": 1.3867151956323932e-05, "loss": 1.5679, "step": 762 }, { "epoch": 0.02, "learning_rate": 1.3885350318471338e-05, "loss": 1.5703, "step": 763 }, { "epoch": 0.02, "learning_rate": 1.3903548680618745e-05, "loss": 1.7695, "step": 764 }, { "epoch": 0.02, "learning_rate": 1.392174704276615e-05, "loss": 1.6709, "step": 765 }, { "epoch": 0.02, "learning_rate": 1.393994540491356e-05, "loss": 1.6501, "step": 766 }, { "epoch": 0.02, "learning_rate": 1.3958143767060965e-05, "loss": 1.7119, "step": 767 }, { "epoch": 0.02, "learning_rate": 1.3976342129208373e-05, "loss": 1.7041, "step": 768 }, { "epoch": 0.02, "learning_rate": 1.3994540491355778e-05, "loss": 1.8096, "step": 769 }, { "epoch": 0.02, "learning_rate": 1.4012738853503186e-05, "loss": 1.6997, "step": 770 }, { "epoch": 0.02, "learning_rate": 1.4030937215650593e-05, "loss": 1.5728, "step": 771 }, { "epoch": 0.02, "learning_rate": 1.4049135577797999e-05, "loss": 1.6362, "step": 772 }, { "epoch": 0.02, "learning_rate": 1.4067333939945406e-05, "loss": 1.7549, "step": 773 }, { "epoch": 0.02, "learning_rate": 1.4085532302092813e-05, "loss": 1.7305, "step": 774 }, { "epoch": 0.02, "learning_rate": 1.410373066424022e-05, "loss": 1.8042, "step": 775 }, { "epoch": 0.02, "learning_rate": 1.4121929026387626e-05, "loss": 1.7236, "step": 776 }, { "epoch": 0.02, "learning_rate": 1.4140127388535032e-05, "loss": 1.7124, "step": 777 }, { "epoch": 0.02, "learning_rate": 1.415832575068244e-05, "loss": 1.4917, "step": 778 }, { "epoch": 0.02, "learning_rate": 1.4176524112829847e-05, "loss": 1.7144, "step": 779 }, { "epoch": 0.02, "learning_rate": 1.4194722474977254e-05, "loss": 1.5745, "step": 780 }, { "epoch": 0.02, "learning_rate": 1.421292083712466e-05, "loss": 1.6592, "step": 781 }, { "epoch": 0.02, "learning_rate": 1.4231119199272067e-05, "loss": 1.6782, "step": 782 }, { "epoch": 0.02, "learning_rate": 1.4249317561419474e-05, "loss": 1.6086, "step": 783 }, { "epoch": 0.02, "learning_rate": 1.426751592356688e-05, "loss": 1.6909, "step": 784 }, { "epoch": 0.02, "learning_rate": 1.4285714285714287e-05, "loss": 1.8833, "step": 785 }, { "epoch": 0.02, "learning_rate": 1.4303912647861693e-05, "loss": 1.8994, "step": 786 }, { "epoch": 0.02, "learning_rate": 1.4322111010009102e-05, "loss": 1.7622, "step": 787 }, { "epoch": 0.02, "learning_rate": 1.4340309372156507e-05, "loss": 1.6392, "step": 788 }, { "epoch": 0.02, "learning_rate": 1.4358507734303915e-05, "loss": 1.7344, "step": 789 }, { "epoch": 0.02, "learning_rate": 1.437670609645132e-05, "loss": 1.6011, "step": 790 }, { "epoch": 0.02, "learning_rate": 1.4394904458598726e-05, "loss": 1.5776, "step": 791 }, { "epoch": 0.02, "learning_rate": 1.4413102820746135e-05, "loss": 1.6992, "step": 792 }, { "epoch": 0.02, "learning_rate": 1.443130118289354e-05, "loss": 1.6357, "step": 793 }, { "epoch": 0.02, "learning_rate": 1.4449499545040948e-05, "loss": 1.6602, "step": 794 }, { "epoch": 0.02, "learning_rate": 1.4467697907188354e-05, "loss": 1.5715, "step": 795 }, { "epoch": 0.02, "learning_rate": 1.4485896269335763e-05, "loss": 1.7363, "step": 796 }, { "epoch": 0.02, "learning_rate": 1.4504094631483168e-05, "loss": 1.7266, "step": 797 }, { "epoch": 0.02, "learning_rate": 1.4522292993630574e-05, "loss": 1.7117, "step": 798 }, { "epoch": 0.02, "learning_rate": 1.4540491355777981e-05, "loss": 1.4861, "step": 799 }, { "epoch": 0.02, "learning_rate": 1.4558689717925387e-05, "loss": 1.7725, "step": 800 }, { "epoch": 0.02, "learning_rate": 1.4576888080072796e-05, "loss": 1.6953, "step": 801 }, { "epoch": 0.02, "learning_rate": 1.4595086442220201e-05, "loss": 1.7456, "step": 802 }, { "epoch": 0.02, "learning_rate": 1.4613284804367609e-05, "loss": 1.7876, "step": 803 }, { "epoch": 0.02, "learning_rate": 1.4631483166515014e-05, "loss": 1.5869, "step": 804 }, { "epoch": 0.02, "learning_rate": 1.464968152866242e-05, "loss": 1.6421, "step": 805 }, { "epoch": 0.02, "learning_rate": 1.4667879890809829e-05, "loss": 1.832, "step": 806 }, { "epoch": 0.02, "learning_rate": 1.4686078252957235e-05, "loss": 1.853, "step": 807 }, { "epoch": 0.02, "learning_rate": 1.4704276615104642e-05, "loss": 1.75, "step": 808 }, { "epoch": 0.02, "learning_rate": 1.4722474977252048e-05, "loss": 1.6318, "step": 809 }, { "epoch": 0.02, "learning_rate": 1.4740673339399457e-05, "loss": 1.6924, "step": 810 }, { "epoch": 0.02, "learning_rate": 1.4758871701546862e-05, "loss": 1.667, "step": 811 }, { "epoch": 0.02, "learning_rate": 1.4777070063694268e-05, "loss": 1.6025, "step": 812 }, { "epoch": 0.02, "learning_rate": 1.4795268425841675e-05, "loss": 1.7002, "step": 813 }, { "epoch": 0.02, "learning_rate": 1.481346678798908e-05, "loss": 1.709, "step": 814 }, { "epoch": 0.02, "learning_rate": 1.483166515013649e-05, "loss": 1.6138, "step": 815 }, { "epoch": 0.02, "learning_rate": 1.4849863512283895e-05, "loss": 1.5864, "step": 816 }, { "epoch": 0.02, "learning_rate": 1.4868061874431303e-05, "loss": 1.7212, "step": 817 }, { "epoch": 0.02, "learning_rate": 1.4886260236578708e-05, "loss": 1.6406, "step": 818 }, { "epoch": 0.02, "learning_rate": 1.4904458598726114e-05, "loss": 1.7178, "step": 819 }, { "epoch": 0.02, "learning_rate": 1.4922656960873523e-05, "loss": 1.5891, "step": 820 }, { "epoch": 0.02, "learning_rate": 1.4940855323020929e-05, "loss": 1.6123, "step": 821 }, { "epoch": 0.02, "learning_rate": 1.4959053685168336e-05, "loss": 1.7097, "step": 822 }, { "epoch": 0.02, "learning_rate": 1.4977252047315742e-05, "loss": 1.686, "step": 823 }, { "epoch": 0.02, "learning_rate": 1.499545040946315e-05, "loss": 1.707, "step": 824 }, { "epoch": 0.02, "learning_rate": 1.5013648771610556e-05, "loss": 1.7334, "step": 825 }, { "epoch": 0.02, "learning_rate": 1.5031847133757964e-05, "loss": 1.854, "step": 826 }, { "epoch": 0.02, "learning_rate": 1.505004549590537e-05, "loss": 1.7129, "step": 827 }, { "epoch": 0.02, "learning_rate": 1.5068243858052775e-05, "loss": 1.582, "step": 828 }, { "epoch": 0.02, "learning_rate": 1.5086442220200184e-05, "loss": 1.5151, "step": 829 }, { "epoch": 0.02, "learning_rate": 1.510464058234759e-05, "loss": 1.7153, "step": 830 }, { "epoch": 0.02, "learning_rate": 1.5122838944494997e-05, "loss": 1.6196, "step": 831 }, { "epoch": 0.02, "learning_rate": 1.5141037306642402e-05, "loss": 1.3193, "step": 832 }, { "epoch": 0.02, "learning_rate": 1.5159235668789811e-05, "loss": 1.6919, "step": 833 }, { "epoch": 0.02, "learning_rate": 1.5177434030937217e-05, "loss": 1.718, "step": 834 }, { "epoch": 0.02, "learning_rate": 1.5195632393084623e-05, "loss": 1.8271, "step": 835 }, { "epoch": 0.02, "learning_rate": 1.521383075523203e-05, "loss": 1.7095, "step": 836 }, { "epoch": 0.02, "learning_rate": 1.5232029117379437e-05, "loss": 1.6343, "step": 837 }, { "epoch": 0.02, "learning_rate": 1.5250227479526845e-05, "loss": 1.5757, "step": 838 }, { "epoch": 0.02, "learning_rate": 1.526842584167425e-05, "loss": 1.6992, "step": 839 }, { "epoch": 0.02, "learning_rate": 1.528662420382166e-05, "loss": 1.8604, "step": 840 }, { "epoch": 0.02, "learning_rate": 1.5304822565969065e-05, "loss": 1.7642, "step": 841 }, { "epoch": 0.02, "learning_rate": 1.532302092811647e-05, "loss": 1.7349, "step": 842 }, { "epoch": 0.02, "learning_rate": 1.5341219290263876e-05, "loss": 1.6255, "step": 843 }, { "epoch": 0.02, "learning_rate": 1.5359417652411285e-05, "loss": 1.6143, "step": 844 }, { "epoch": 0.02, "learning_rate": 1.537761601455869e-05, "loss": 1.687, "step": 845 }, { "epoch": 0.02, "learning_rate": 1.5395814376706097e-05, "loss": 1.6729, "step": 846 }, { "epoch": 0.02, "learning_rate": 1.5414012738853506e-05, "loss": 1.7275, "step": 847 }, { "epoch": 0.02, "learning_rate": 1.543221110100091e-05, "loss": 1.9697, "step": 848 }, { "epoch": 0.02, "learning_rate": 1.5450409463148317e-05, "loss": 1.6768, "step": 849 }, { "epoch": 0.02, "learning_rate": 1.5468607825295726e-05, "loss": 1.8364, "step": 850 }, { "epoch": 0.02, "learning_rate": 1.548680618744313e-05, "loss": 1.5547, "step": 851 }, { "epoch": 0.02, "learning_rate": 1.550500454959054e-05, "loss": 1.5278, "step": 852 }, { "epoch": 0.02, "learning_rate": 1.5523202911737946e-05, "loss": 1.6289, "step": 853 }, { "epoch": 0.02, "learning_rate": 1.5541401273885352e-05, "loss": 1.6216, "step": 854 }, { "epoch": 0.02, "learning_rate": 1.5559599636032757e-05, "loss": 1.8296, "step": 855 }, { "epoch": 0.02, "learning_rate": 1.5577797998180163e-05, "loss": 1.689, "step": 856 }, { "epoch": 0.02, "learning_rate": 1.5595996360327572e-05, "loss": 1.5972, "step": 857 }, { "epoch": 0.02, "learning_rate": 1.5614194722474978e-05, "loss": 1.6094, "step": 858 }, { "epoch": 0.02, "learning_rate": 1.5632393084622387e-05, "loss": 1.5786, "step": 859 }, { "epoch": 0.02, "learning_rate": 1.5650591446769792e-05, "loss": 1.708, "step": 860 }, { "epoch": 0.02, "learning_rate": 1.56687898089172e-05, "loss": 1.6338, "step": 861 }, { "epoch": 0.02, "learning_rate": 1.5686988171064607e-05, "loss": 1.6802, "step": 862 }, { "epoch": 0.02, "learning_rate": 1.5705186533212013e-05, "loss": 1.6382, "step": 863 }, { "epoch": 0.02, "learning_rate": 1.5723384895359418e-05, "loss": 1.624, "step": 864 }, { "epoch": 0.02, "learning_rate": 1.5741583257506824e-05, "loss": 1.4844, "step": 865 }, { "epoch": 0.02, "learning_rate": 1.5759781619654233e-05, "loss": 1.6465, "step": 866 }, { "epoch": 0.02, "learning_rate": 1.577797998180164e-05, "loss": 1.6704, "step": 867 }, { "epoch": 0.02, "learning_rate": 1.5796178343949047e-05, "loss": 1.6113, "step": 868 }, { "epoch": 0.02, "learning_rate": 1.5814376706096453e-05, "loss": 1.7158, "step": 869 }, { "epoch": 0.02, "learning_rate": 1.583257506824386e-05, "loss": 1.5703, "step": 870 }, { "epoch": 0.02, "learning_rate": 1.5850773430391268e-05, "loss": 1.7524, "step": 871 }, { "epoch": 0.02, "learning_rate": 1.5868971792538673e-05, "loss": 1.6128, "step": 872 }, { "epoch": 0.02, "learning_rate": 1.588717015468608e-05, "loss": 1.7261, "step": 873 }, { "epoch": 0.02, "learning_rate": 1.5905368516833485e-05, "loss": 1.6851, "step": 874 }, { "epoch": 0.02, "learning_rate": 1.5923566878980894e-05, "loss": 1.6362, "step": 875 }, { "epoch": 0.02, "learning_rate": 1.59417652411283e-05, "loss": 1.6152, "step": 876 }, { "epoch": 0.02, "learning_rate": 1.5959963603275705e-05, "loss": 1.8096, "step": 877 }, { "epoch": 0.02, "learning_rate": 1.5978161965423114e-05, "loss": 1.7358, "step": 878 }, { "epoch": 0.02, "learning_rate": 1.599636032757052e-05, "loss": 1.8105, "step": 879 }, { "epoch": 0.02, "learning_rate": 1.601455868971793e-05, "loss": 1.606, "step": 880 }, { "epoch": 0.02, "learning_rate": 1.6032757051865334e-05, "loss": 1.5742, "step": 881 }, { "epoch": 0.02, "learning_rate": 1.605095541401274e-05, "loss": 1.7314, "step": 882 }, { "epoch": 0.02, "learning_rate": 1.6069153776160145e-05, "loss": 1.6938, "step": 883 }, { "epoch": 0.02, "learning_rate": 1.608735213830755e-05, "loss": 1.6846, "step": 884 }, { "epoch": 0.02, "learning_rate": 1.610555050045496e-05, "loss": 1.668, "step": 885 }, { "epoch": 0.02, "learning_rate": 1.6123748862602366e-05, "loss": 1.6738, "step": 886 }, { "epoch": 0.02, "learning_rate": 1.6141947224749775e-05, "loss": 1.6431, "step": 887 }, { "epoch": 0.02, "learning_rate": 1.616014558689718e-05, "loss": 1.8218, "step": 888 }, { "epoch": 0.02, "learning_rate": 1.617834394904459e-05, "loss": 1.8979, "step": 889 }, { "epoch": 0.02, "learning_rate": 1.6196542311191995e-05, "loss": 1.7241, "step": 890 }, { "epoch": 0.02, "learning_rate": 1.62147406733394e-05, "loss": 1.7324, "step": 891 }, { "epoch": 0.02, "learning_rate": 1.6232939035486806e-05, "loss": 1.7695, "step": 892 }, { "epoch": 0.02, "learning_rate": 1.6251137397634212e-05, "loss": 1.646, "step": 893 }, { "epoch": 0.02, "learning_rate": 1.626933575978162e-05, "loss": 1.6265, "step": 894 }, { "epoch": 0.02, "learning_rate": 1.6287534121929026e-05, "loss": 1.77, "step": 895 }, { "epoch": 0.02, "learning_rate": 1.6305732484076436e-05, "loss": 1.6343, "step": 896 }, { "epoch": 0.02, "learning_rate": 1.632393084622384e-05, "loss": 1.791, "step": 897 }, { "epoch": 0.02, "learning_rate": 1.6342129208371247e-05, "loss": 1.7959, "step": 898 }, { "epoch": 0.02, "learning_rate": 1.6360327570518656e-05, "loss": 1.5366, "step": 899 }, { "epoch": 0.02, "learning_rate": 1.637852593266606e-05, "loss": 1.7461, "step": 900 }, { "epoch": 0.02, "learning_rate": 1.6396724294813467e-05, "loss": 1.7241, "step": 901 }, { "epoch": 0.02, "learning_rate": 1.6414922656960876e-05, "loss": 1.5913, "step": 902 }, { "epoch": 0.02, "learning_rate": 1.643312101910828e-05, "loss": 1.5698, "step": 903 }, { "epoch": 0.02, "learning_rate": 1.6451319381255687e-05, "loss": 1.8135, "step": 904 }, { "epoch": 0.02, "learning_rate": 1.6469517743403096e-05, "loss": 1.5627, "step": 905 }, { "epoch": 0.02, "learning_rate": 1.6487716105550502e-05, "loss": 1.5908, "step": 906 }, { "epoch": 0.02, "learning_rate": 1.6505914467697908e-05, "loss": 1.7427, "step": 907 }, { "epoch": 0.02, "learning_rate": 1.6524112829845317e-05, "loss": 1.6074, "step": 908 }, { "epoch": 0.02, "learning_rate": 1.6542311191992722e-05, "loss": 1.6519, "step": 909 }, { "epoch": 0.02, "learning_rate": 1.6560509554140128e-05, "loss": 1.6323, "step": 910 }, { "epoch": 0.02, "learning_rate": 1.6578707916287537e-05, "loss": 1.6909, "step": 911 }, { "epoch": 0.02, "learning_rate": 1.6596906278434943e-05, "loss": 1.6787, "step": 912 }, { "epoch": 0.02, "learning_rate": 1.6615104640582348e-05, "loss": 1.6548, "step": 913 }, { "epoch": 0.02, "learning_rate": 1.6633303002729754e-05, "loss": 1.6992, "step": 914 }, { "epoch": 0.02, "learning_rate": 1.6651501364877163e-05, "loss": 1.7227, "step": 915 }, { "epoch": 0.03, "learning_rate": 1.666969972702457e-05, "loss": 1.6699, "step": 916 }, { "epoch": 0.03, "learning_rate": 1.6687898089171977e-05, "loss": 1.6333, "step": 917 }, { "epoch": 0.03, "learning_rate": 1.6706096451319383e-05, "loss": 1.6934, "step": 918 }, { "epoch": 0.03, "learning_rate": 1.6724294813466792e-05, "loss": 1.7041, "step": 919 }, { "epoch": 0.03, "learning_rate": 1.6742493175614198e-05, "loss": 1.5173, "step": 920 }, { "epoch": 0.03, "learning_rate": 1.6760691537761603e-05, "loss": 1.5923, "step": 921 }, { "epoch": 0.03, "learning_rate": 1.677888989990901e-05, "loss": 1.625, "step": 922 }, { "epoch": 0.03, "learning_rate": 1.6797088262056415e-05, "loss": 1.709, "step": 923 }, { "epoch": 0.03, "learning_rate": 1.6815286624203824e-05, "loss": 1.7246, "step": 924 }, { "epoch": 0.03, "learning_rate": 1.683348498635123e-05, "loss": 1.5835, "step": 925 }, { "epoch": 0.03, "learning_rate": 1.6851683348498638e-05, "loss": 1.6211, "step": 926 }, { "epoch": 0.03, "learning_rate": 1.6869881710646044e-05, "loss": 1.7192, "step": 927 }, { "epoch": 0.03, "learning_rate": 1.688808007279345e-05, "loss": 1.6191, "step": 928 }, { "epoch": 0.03, "learning_rate": 1.690627843494086e-05, "loss": 1.5234, "step": 929 }, { "epoch": 0.03, "learning_rate": 1.6924476797088264e-05, "loss": 1.5371, "step": 930 }, { "epoch": 0.03, "learning_rate": 1.694267515923567e-05, "loss": 1.5693, "step": 931 }, { "epoch": 0.03, "learning_rate": 1.6960873521383075e-05, "loss": 1.5376, "step": 932 }, { "epoch": 0.03, "learning_rate": 1.6979071883530484e-05, "loss": 1.8384, "step": 933 }, { "epoch": 0.03, "learning_rate": 1.699727024567789e-05, "loss": 1.6523, "step": 934 }, { "epoch": 0.03, "learning_rate": 1.7015468607825296e-05, "loss": 1.6172, "step": 935 }, { "epoch": 0.03, "learning_rate": 1.7033666969972705e-05, "loss": 1.5581, "step": 936 }, { "epoch": 0.03, "learning_rate": 1.705186533212011e-05, "loss": 1.6692, "step": 937 }, { "epoch": 0.03, "learning_rate": 1.707006369426752e-05, "loss": 1.7764, "step": 938 }, { "epoch": 0.03, "learning_rate": 1.7088262056414925e-05, "loss": 1.6218, "step": 939 }, { "epoch": 0.03, "learning_rate": 1.710646041856233e-05, "loss": 1.6333, "step": 940 }, { "epoch": 0.03, "learning_rate": 1.7124658780709736e-05, "loss": 1.5449, "step": 941 }, { "epoch": 0.03, "learning_rate": 1.7142857142857142e-05, "loss": 1.481, "step": 942 }, { "epoch": 0.03, "learning_rate": 1.716105550500455e-05, "loss": 1.6582, "step": 943 }, { "epoch": 0.03, "learning_rate": 1.7179253867151956e-05, "loss": 1.6836, "step": 944 }, { "epoch": 0.03, "learning_rate": 1.7197452229299365e-05, "loss": 1.6072, "step": 945 }, { "epoch": 0.03, "learning_rate": 1.721565059144677e-05, "loss": 1.6694, "step": 946 }, { "epoch": 0.03, "learning_rate": 1.723384895359418e-05, "loss": 1.6426, "step": 947 }, { "epoch": 0.03, "learning_rate": 1.7252047315741586e-05, "loss": 1.5459, "step": 948 }, { "epoch": 0.03, "learning_rate": 1.727024567788899e-05, "loss": 1.6777, "step": 949 }, { "epoch": 0.03, "learning_rate": 1.7288444040036397e-05, "loss": 1.894, "step": 950 }, { "epoch": 0.03, "learning_rate": 1.7306642402183803e-05, "loss": 1.5796, "step": 951 }, { "epoch": 0.03, "learning_rate": 1.732484076433121e-05, "loss": 1.5698, "step": 952 }, { "epoch": 0.03, "learning_rate": 1.7343039126478617e-05, "loss": 1.6328, "step": 953 }, { "epoch": 0.03, "learning_rate": 1.7361237488626026e-05, "loss": 1.7642, "step": 954 }, { "epoch": 0.03, "learning_rate": 1.7379435850773432e-05, "loss": 1.6274, "step": 955 }, { "epoch": 0.03, "learning_rate": 1.7397634212920838e-05, "loss": 1.5046, "step": 956 }, { "epoch": 0.03, "learning_rate": 1.7415832575068247e-05, "loss": 1.7622, "step": 957 }, { "epoch": 0.03, "learning_rate": 1.7434030937215652e-05, "loss": 1.7241, "step": 958 }, { "epoch": 0.03, "learning_rate": 1.7452229299363058e-05, "loss": 1.678, "step": 959 }, { "epoch": 0.03, "learning_rate": 1.7470427661510463e-05, "loss": 1.5757, "step": 960 }, { "epoch": 0.03, "learning_rate": 1.7488626023657872e-05, "loss": 1.6741, "step": 961 }, { "epoch": 0.03, "learning_rate": 1.7506824385805278e-05, "loss": 1.9556, "step": 962 }, { "epoch": 0.03, "learning_rate": 1.7525022747952684e-05, "loss": 1.6633, "step": 963 }, { "epoch": 0.03, "learning_rate": 1.7543221110100093e-05, "loss": 1.5986, "step": 964 }, { "epoch": 0.03, "learning_rate": 1.75614194722475e-05, "loss": 1.6421, "step": 965 }, { "epoch": 0.03, "learning_rate": 1.7579617834394907e-05, "loss": 1.7395, "step": 966 }, { "epoch": 0.03, "learning_rate": 1.7597816196542313e-05, "loss": 1.5757, "step": 967 }, { "epoch": 0.03, "learning_rate": 1.761601455868972e-05, "loss": 1.8057, "step": 968 }, { "epoch": 0.03, "learning_rate": 1.7634212920837128e-05, "loss": 1.6963, "step": 969 }, { "epoch": 0.03, "learning_rate": 1.7652411282984533e-05, "loss": 1.7212, "step": 970 }, { "epoch": 0.03, "learning_rate": 1.767060964513194e-05, "loss": 1.5488, "step": 971 }, { "epoch": 0.03, "learning_rate": 1.7688808007279345e-05, "loss": 1.8647, "step": 972 }, { "epoch": 0.03, "learning_rate": 1.7707006369426754e-05, "loss": 1.6846, "step": 973 }, { "epoch": 0.03, "learning_rate": 1.772520473157416e-05, "loss": 1.6416, "step": 974 }, { "epoch": 0.03, "learning_rate": 1.7743403093721568e-05, "loss": 1.6748, "step": 975 }, { "epoch": 0.03, "learning_rate": 1.7761601455868974e-05, "loss": 1.6631, "step": 976 }, { "epoch": 0.03, "learning_rate": 1.777979981801638e-05, "loss": 1.6072, "step": 977 }, { "epoch": 0.03, "learning_rate": 1.779799818016379e-05, "loss": 1.6348, "step": 978 }, { "epoch": 0.03, "learning_rate": 1.7816196542311194e-05, "loss": 1.5864, "step": 979 }, { "epoch": 0.03, "learning_rate": 1.78343949044586e-05, "loss": 1.6516, "step": 980 }, { "epoch": 0.03, "learning_rate": 1.7852593266606005e-05, "loss": 1.5693, "step": 981 }, { "epoch": 0.03, "learning_rate": 1.7870791628753414e-05, "loss": 1.6436, "step": 982 }, { "epoch": 0.03, "learning_rate": 1.788898999090082e-05, "loss": 1.4736, "step": 983 }, { "epoch": 0.03, "learning_rate": 1.790718835304823e-05, "loss": 1.4756, "step": 984 }, { "epoch": 0.03, "learning_rate": 1.7925386715195635e-05, "loss": 1.5879, "step": 985 }, { "epoch": 0.03, "learning_rate": 1.794358507734304e-05, "loss": 1.6646, "step": 986 }, { "epoch": 0.03, "learning_rate": 1.796178343949045e-05, "loss": 1.6621, "step": 987 }, { "epoch": 0.03, "learning_rate": 1.7979981801637855e-05, "loss": 1.6904, "step": 988 }, { "epoch": 0.03, "learning_rate": 1.799818016378526e-05, "loss": 1.7368, "step": 989 }, { "epoch": 0.03, "learning_rate": 1.8016378525932666e-05, "loss": 1.6777, "step": 990 }, { "epoch": 0.03, "learning_rate": 1.8034576888080075e-05, "loss": 1.5171, "step": 991 }, { "epoch": 0.03, "learning_rate": 1.805277525022748e-05, "loss": 1.5259, "step": 992 }, { "epoch": 0.03, "learning_rate": 1.8070973612374886e-05, "loss": 1.5981, "step": 993 }, { "epoch": 0.03, "learning_rate": 1.8089171974522295e-05, "loss": 1.6287, "step": 994 }, { "epoch": 0.03, "learning_rate": 1.81073703366697e-05, "loss": 1.6929, "step": 995 }, { "epoch": 0.03, "learning_rate": 1.812556869881711e-05, "loss": 1.5002, "step": 996 }, { "epoch": 0.03, "learning_rate": 1.8143767060964516e-05, "loss": 1.6206, "step": 997 }, { "epoch": 0.03, "learning_rate": 1.816196542311192e-05, "loss": 1.668, "step": 998 }, { "epoch": 0.03, "learning_rate": 1.8180163785259327e-05, "loss": 1.9268, "step": 999 }, { "epoch": 0.03, "learning_rate": 1.8198362147406733e-05, "loss": 1.6484, "step": 1000 }, { "epoch": 0.03, "learning_rate": 1.821656050955414e-05, "loss": 2.0352, "step": 1001 }, { "epoch": 0.03, "learning_rate": 1.8234758871701547e-05, "loss": 1.3999, "step": 1002 }, { "epoch": 0.03, "learning_rate": 1.8252957233848956e-05, "loss": 1.4749, "step": 1003 }, { "epoch": 0.03, "learning_rate": 1.8271155595996362e-05, "loss": 1.4119, "step": 1004 }, { "epoch": 0.03, "learning_rate": 1.828935395814377e-05, "loss": 1.7988, "step": 1005 }, { "epoch": 0.03, "learning_rate": 1.8307552320291177e-05, "loss": 1.7095, "step": 1006 }, { "epoch": 0.03, "learning_rate": 1.8325750682438582e-05, "loss": 1.5645, "step": 1007 }, { "epoch": 0.03, "learning_rate": 1.8343949044585988e-05, "loss": 1.6904, "step": 1008 }, { "epoch": 0.03, "learning_rate": 1.8362147406733393e-05, "loss": 1.7173, "step": 1009 }, { "epoch": 0.03, "learning_rate": 1.8380345768880802e-05, "loss": 1.666, "step": 1010 }, { "epoch": 0.03, "learning_rate": 1.8398544131028208e-05, "loss": 1.5039, "step": 1011 }, { "epoch": 0.03, "learning_rate": 1.8416742493175617e-05, "loss": 1.6963, "step": 1012 }, { "epoch": 0.03, "learning_rate": 1.8434940855323023e-05, "loss": 1.6948, "step": 1013 }, { "epoch": 0.03, "learning_rate": 1.845313921747043e-05, "loss": 1.667, "step": 1014 }, { "epoch": 0.03, "learning_rate": 1.8471337579617837e-05, "loss": 1.4907, "step": 1015 }, { "epoch": 0.03, "learning_rate": 1.8489535941765243e-05, "loss": 1.7285, "step": 1016 }, { "epoch": 0.03, "learning_rate": 1.850773430391265e-05, "loss": 1.6763, "step": 1017 }, { "epoch": 0.03, "learning_rate": 1.8525932666060054e-05, "loss": 1.6392, "step": 1018 }, { "epoch": 0.03, "learning_rate": 1.8544131028207463e-05, "loss": 1.6265, "step": 1019 }, { "epoch": 0.03, "learning_rate": 1.856232939035487e-05, "loss": 1.4673, "step": 1020 }, { "epoch": 0.03, "learning_rate": 1.8580527752502275e-05, "loss": 1.5966, "step": 1021 }, { "epoch": 0.03, "learning_rate": 1.8598726114649684e-05, "loss": 1.5942, "step": 1022 }, { "epoch": 0.03, "learning_rate": 1.861692447679709e-05, "loss": 1.6392, "step": 1023 }, { "epoch": 0.03, "learning_rate": 1.8635122838944498e-05, "loss": 1.5898, "step": 1024 }, { "epoch": 0.03, "learning_rate": 1.8653321201091904e-05, "loss": 1.603, "step": 1025 }, { "epoch": 0.03, "learning_rate": 1.867151956323931e-05, "loss": 1.646, "step": 1026 }, { "epoch": 0.03, "learning_rate": 1.8689717925386715e-05, "loss": 1.5771, "step": 1027 }, { "epoch": 0.03, "learning_rate": 1.8707916287534124e-05, "loss": 1.7891, "step": 1028 }, { "epoch": 0.03, "learning_rate": 1.872611464968153e-05, "loss": 1.5283, "step": 1029 }, { "epoch": 0.03, "learning_rate": 1.8744313011828935e-05, "loss": 1.5752, "step": 1030 }, { "epoch": 0.03, "learning_rate": 1.8762511373976344e-05, "loss": 1.603, "step": 1031 }, { "epoch": 0.03, "learning_rate": 1.878070973612375e-05, "loss": 1.7573, "step": 1032 }, { "epoch": 0.03, "learning_rate": 1.879890809827116e-05, "loss": 1.6611, "step": 1033 }, { "epoch": 0.03, "learning_rate": 1.8817106460418565e-05, "loss": 1.6187, "step": 1034 }, { "epoch": 0.03, "learning_rate": 1.883530482256597e-05, "loss": 1.5759, "step": 1035 }, { "epoch": 0.03, "learning_rate": 1.8853503184713376e-05, "loss": 1.6885, "step": 1036 }, { "epoch": 0.03, "learning_rate": 1.8871701546860785e-05, "loss": 1.603, "step": 1037 }, { "epoch": 0.03, "learning_rate": 1.888989990900819e-05, "loss": 1.7061, "step": 1038 }, { "epoch": 0.03, "learning_rate": 1.8908098271155596e-05, "loss": 1.5664, "step": 1039 }, { "epoch": 0.03, "learning_rate": 1.8926296633303005e-05, "loss": 1.7734, "step": 1040 }, { "epoch": 0.03, "learning_rate": 1.894449499545041e-05, "loss": 1.6165, "step": 1041 }, { "epoch": 0.03, "learning_rate": 1.8962693357597816e-05, "loss": 1.5405, "step": 1042 }, { "epoch": 0.03, "learning_rate": 1.8980891719745225e-05, "loss": 1.6182, "step": 1043 }, { "epoch": 0.03, "learning_rate": 1.899909008189263e-05, "loss": 1.6572, "step": 1044 }, { "epoch": 0.03, "learning_rate": 1.901728844404004e-05, "loss": 1.7712, "step": 1045 }, { "epoch": 0.03, "learning_rate": 1.9035486806187446e-05, "loss": 1.6875, "step": 1046 }, { "epoch": 0.03, "learning_rate": 1.905368516833485e-05, "loss": 1.7993, "step": 1047 }, { "epoch": 0.03, "learning_rate": 1.9071883530482257e-05, "loss": 1.5728, "step": 1048 }, { "epoch": 0.03, "learning_rate": 1.9090081892629663e-05, "loss": 1.6138, "step": 1049 }, { "epoch": 0.03, "learning_rate": 1.910828025477707e-05, "loss": 1.7317, "step": 1050 }, { "epoch": 0.03, "learning_rate": 1.9126478616924477e-05, "loss": 1.9961, "step": 1051 }, { "epoch": 0.03, "learning_rate": 1.9144676979071886e-05, "loss": 1.6128, "step": 1052 }, { "epoch": 0.03, "learning_rate": 1.9162875341219292e-05, "loss": 1.5933, "step": 1053 }, { "epoch": 0.03, "learning_rate": 1.91810737033667e-05, "loss": 1.6421, "step": 1054 }, { "epoch": 0.03, "learning_rate": 1.9199272065514107e-05, "loss": 1.6113, "step": 1055 }, { "epoch": 0.03, "learning_rate": 1.9217470427661512e-05, "loss": 1.6035, "step": 1056 }, { "epoch": 0.03, "learning_rate": 1.9235668789808918e-05, "loss": 1.6055, "step": 1057 }, { "epoch": 0.03, "learning_rate": 1.9253867151956323e-05, "loss": 1.543, "step": 1058 }, { "epoch": 0.03, "learning_rate": 1.9272065514103732e-05, "loss": 1.6987, "step": 1059 }, { "epoch": 0.03, "learning_rate": 1.9290263876251138e-05, "loss": 1.9043, "step": 1060 }, { "epoch": 0.03, "learning_rate": 1.9308462238398547e-05, "loss": 1.6816, "step": 1061 }, { "epoch": 0.03, "learning_rate": 1.9326660600545953e-05, "loss": 1.4492, "step": 1062 }, { "epoch": 0.03, "learning_rate": 1.9344858962693362e-05, "loss": 1.6982, "step": 1063 }, { "epoch": 0.03, "learning_rate": 1.9363057324840767e-05, "loss": 1.8223, "step": 1064 }, { "epoch": 0.03, "learning_rate": 1.9381255686988173e-05, "loss": 1.5728, "step": 1065 }, { "epoch": 0.03, "learning_rate": 1.939945404913558e-05, "loss": 1.6108, "step": 1066 }, { "epoch": 0.03, "learning_rate": 1.9417652411282984e-05, "loss": 1.6113, "step": 1067 }, { "epoch": 0.03, "learning_rate": 1.9435850773430393e-05, "loss": 1.4299, "step": 1068 }, { "epoch": 0.03, "learning_rate": 1.94540491355778e-05, "loss": 1.7275, "step": 1069 }, { "epoch": 0.03, "learning_rate": 1.9472247497725208e-05, "loss": 1.5, "step": 1070 }, { "epoch": 0.03, "learning_rate": 1.9490445859872614e-05, "loss": 1.6792, "step": 1071 }, { "epoch": 0.03, "learning_rate": 1.950864422202002e-05, "loss": 1.6919, "step": 1072 }, { "epoch": 0.03, "learning_rate": 1.9526842584167428e-05, "loss": 1.9136, "step": 1073 }, { "epoch": 0.03, "learning_rate": 1.9545040946314834e-05, "loss": 1.54, "step": 1074 }, { "epoch": 0.03, "learning_rate": 1.956323930846224e-05, "loss": 1.7007, "step": 1075 }, { "epoch": 0.03, "learning_rate": 1.9581437670609645e-05, "loss": 1.6533, "step": 1076 }, { "epoch": 0.03, "learning_rate": 1.9599636032757054e-05, "loss": 1.792, "step": 1077 }, { "epoch": 0.03, "learning_rate": 1.961783439490446e-05, "loss": 1.6553, "step": 1078 }, { "epoch": 0.03, "learning_rate": 1.9636032757051865e-05, "loss": 1.5176, "step": 1079 }, { "epoch": 0.03, "learning_rate": 1.9654231119199274e-05, "loss": 1.8794, "step": 1080 }, { "epoch": 0.03, "learning_rate": 1.967242948134668e-05, "loss": 1.6011, "step": 1081 }, { "epoch": 0.03, "learning_rate": 1.969062784349409e-05, "loss": 1.6069, "step": 1082 }, { "epoch": 0.03, "learning_rate": 1.9708826205641495e-05, "loss": 1.5571, "step": 1083 }, { "epoch": 0.03, "learning_rate": 1.97270245677889e-05, "loss": 1.5667, "step": 1084 }, { "epoch": 0.03, "learning_rate": 1.9745222929936306e-05, "loss": 1.4343, "step": 1085 }, { "epoch": 0.03, "learning_rate": 1.976342129208371e-05, "loss": 1.4961, "step": 1086 }, { "epoch": 0.03, "learning_rate": 1.978161965423112e-05, "loss": 1.7544, "step": 1087 }, { "epoch": 0.03, "learning_rate": 1.9799818016378526e-05, "loss": 1.6333, "step": 1088 }, { "epoch": 0.03, "learning_rate": 1.9818016378525935e-05, "loss": 1.6182, "step": 1089 }, { "epoch": 0.03, "learning_rate": 1.983621474067334e-05, "loss": 1.5803, "step": 1090 }, { "epoch": 0.03, "learning_rate": 1.985441310282075e-05, "loss": 1.6396, "step": 1091 }, { "epoch": 0.03, "learning_rate": 1.9872611464968155e-05, "loss": 1.6389, "step": 1092 }, { "epoch": 0.03, "learning_rate": 1.989080982711556e-05, "loss": 1.4771, "step": 1093 }, { "epoch": 0.03, "learning_rate": 1.9909008189262967e-05, "loss": 1.6631, "step": 1094 }, { "epoch": 0.03, "learning_rate": 1.9927206551410376e-05, "loss": 1.6904, "step": 1095 }, { "epoch": 0.03, "learning_rate": 1.994540491355778e-05, "loss": 1.5474, "step": 1096 }, { "epoch": 0.03, "learning_rate": 1.9963603275705187e-05, "loss": 1.6157, "step": 1097 }, { "epoch": 0.03, "learning_rate": 1.9981801637852596e-05, "loss": 1.5874, "step": 1098 }, { "epoch": 0.03, "learning_rate": 2e-05, "loss": 1.5986, "step": 1099 }, { "epoch": 0.03, "learning_rate": 1.9999999960882353e-05, "loss": 1.6323, "step": 1100 }, { "epoch": 0.03, "learning_rate": 1.9999999843529404e-05, "loss": 1.5498, "step": 1101 }, { "epoch": 0.03, "learning_rate": 1.9999999647941165e-05, "loss": 1.6782, "step": 1102 }, { "epoch": 0.03, "learning_rate": 1.9999999374117626e-05, "loss": 1.6123, "step": 1103 }, { "epoch": 0.03, "learning_rate": 1.9999999022058797e-05, "loss": 1.6426, "step": 1104 }, { "epoch": 0.03, "learning_rate": 1.9999998591764674e-05, "loss": 1.6406, "step": 1105 }, { "epoch": 0.03, "learning_rate": 1.9999998083235268e-05, "loss": 1.4731, "step": 1106 }, { "epoch": 0.03, "learning_rate": 1.9999997496470578e-05, "loss": 1.479, "step": 1107 }, { "epoch": 0.03, "learning_rate": 1.999999683147061e-05, "loss": 1.5857, "step": 1108 }, { "epoch": 0.03, "learning_rate": 1.999999608823537e-05, "loss": 1.5962, "step": 1109 }, { "epoch": 0.03, "learning_rate": 1.9999995266764866e-05, "loss": 1.9678, "step": 1110 }, { "epoch": 0.03, "learning_rate": 1.9999994367059094e-05, "loss": 1.4417, "step": 1111 }, { "epoch": 0.03, "learning_rate": 1.9999993389118072e-05, "loss": 1.688, "step": 1112 }, { "epoch": 0.03, "learning_rate": 1.9999992332941804e-05, "loss": 1.7129, "step": 1113 }, { "epoch": 0.03, "learning_rate": 1.99999911985303e-05, "loss": 1.7202, "step": 1114 }, { "epoch": 0.03, "learning_rate": 1.9999989985883563e-05, "loss": 1.7349, "step": 1115 }, { "epoch": 0.03, "learning_rate": 1.999998869500161e-05, "loss": 1.4502, "step": 1116 }, { "epoch": 0.03, "learning_rate": 1.999998732588445e-05, "loss": 1.7661, "step": 1117 }, { "epoch": 0.03, "learning_rate": 1.9999985878532087e-05, "loss": 1.457, "step": 1118 }, { "epoch": 0.03, "learning_rate": 1.9999984352944536e-05, "loss": 1.4648, "step": 1119 }, { "epoch": 0.03, "learning_rate": 1.9999982749121813e-05, "loss": 1.6006, "step": 1120 }, { "epoch": 0.03, "learning_rate": 1.9999981067063928e-05, "loss": 1.5615, "step": 1121 }, { "epoch": 0.03, "learning_rate": 1.9999979306770892e-05, "loss": 1.7134, "step": 1122 }, { "epoch": 0.03, "learning_rate": 1.999997746824272e-05, "loss": 1.9385, "step": 1123 }, { "epoch": 0.03, "learning_rate": 1.9999975551479425e-05, "loss": 1.5808, "step": 1124 }, { "epoch": 0.03, "learning_rate": 1.9999973556481027e-05, "loss": 1.6392, "step": 1125 }, { "epoch": 0.03, "learning_rate": 1.9999971483247535e-05, "loss": 1.6333, "step": 1126 }, { "epoch": 0.03, "learning_rate": 1.9999969331778974e-05, "loss": 1.5549, "step": 1127 }, { "epoch": 0.03, "learning_rate": 1.999996710207535e-05, "loss": 1.5122, "step": 1128 }, { "epoch": 0.03, "learning_rate": 1.9999964794136685e-05, "loss": 1.5508, "step": 1129 }, { "epoch": 0.03, "learning_rate": 1.9999962407962998e-05, "loss": 1.5286, "step": 1130 }, { "epoch": 0.03, "learning_rate": 1.9999959943554313e-05, "loss": 1.666, "step": 1131 }, { "epoch": 0.03, "learning_rate": 1.999995740091064e-05, "loss": 1.6333, "step": 1132 }, { "epoch": 0.03, "learning_rate": 1.9999954780032e-05, "loss": 1.6006, "step": 1133 }, { "epoch": 0.03, "learning_rate": 1.999995208091842e-05, "loss": 1.5779, "step": 1134 }, { "epoch": 0.03, "learning_rate": 1.9999949303569915e-05, "loss": 1.8027, "step": 1135 }, { "epoch": 0.03, "learning_rate": 1.999994644798651e-05, "loss": 1.6367, "step": 1136 }, { "epoch": 0.03, "learning_rate": 1.9999943514168226e-05, "loss": 1.5662, "step": 1137 }, { "epoch": 0.03, "learning_rate": 1.9999940502115084e-05, "loss": 1.5703, "step": 1138 }, { "epoch": 0.03, "learning_rate": 1.9999937411827113e-05, "loss": 1.7036, "step": 1139 }, { "epoch": 0.03, "learning_rate": 1.9999934243304333e-05, "loss": 1.6919, "step": 1140 }, { "epoch": 0.03, "learning_rate": 1.999993099654677e-05, "loss": 1.6826, "step": 1141 }, { "epoch": 0.03, "learning_rate": 1.9999927671554448e-05, "loss": 1.7842, "step": 1142 }, { "epoch": 0.03, "learning_rate": 1.9999924268327397e-05, "loss": 1.4775, "step": 1143 }, { "epoch": 0.03, "learning_rate": 1.999992078686564e-05, "loss": 1.5427, "step": 1144 }, { "epoch": 0.03, "learning_rate": 1.9999917227169203e-05, "loss": 1.687, "step": 1145 }, { "epoch": 0.03, "learning_rate": 1.9999913589238118e-05, "loss": 1.6938, "step": 1146 }, { "epoch": 0.03, "learning_rate": 1.999990987307241e-05, "loss": 1.4739, "step": 1147 }, { "epoch": 0.03, "learning_rate": 1.999990607867211e-05, "loss": 1.561, "step": 1148 }, { "epoch": 0.03, "learning_rate": 1.9999902206037248e-05, "loss": 1.7974, "step": 1149 }, { "epoch": 0.03, "learning_rate": 1.999989825516785e-05, "loss": 1.7595, "step": 1150 }, { "epoch": 0.03, "learning_rate": 1.999989422606395e-05, "loss": 1.5742, "step": 1151 }, { "epoch": 0.03, "learning_rate": 1.9999890118725583e-05, "loss": 1.668, "step": 1152 }, { "epoch": 0.03, "learning_rate": 1.999988593315278e-05, "loss": 1.5129, "step": 1153 }, { "epoch": 0.03, "learning_rate": 1.999988166934557e-05, "loss": 1.7036, "step": 1154 }, { "epoch": 0.03, "learning_rate": 1.999987732730399e-05, "loss": 1.5352, "step": 1155 }, { "epoch": 0.03, "learning_rate": 1.9999872907028065e-05, "loss": 1.5525, "step": 1156 }, { "epoch": 0.03, "learning_rate": 1.999986840851784e-05, "loss": 1.5332, "step": 1157 }, { "epoch": 0.03, "learning_rate": 1.999986383177335e-05, "loss": 1.5383, "step": 1158 }, { "epoch": 0.03, "learning_rate": 1.9999859176794623e-05, "loss": 1.6123, "step": 1159 }, { "epoch": 0.03, "learning_rate": 1.9999854443581704e-05, "loss": 1.5815, "step": 1160 }, { "epoch": 0.03, "learning_rate": 1.9999849632134626e-05, "loss": 1.3809, "step": 1161 }, { "epoch": 0.03, "learning_rate": 1.9999844742453426e-05, "loss": 1.7295, "step": 1162 }, { "epoch": 0.03, "learning_rate": 1.9999839774538143e-05, "loss": 1.5181, "step": 1163 }, { "epoch": 0.03, "learning_rate": 1.9999834728388813e-05, "loss": 1.6914, "step": 1164 }, { "epoch": 0.03, "learning_rate": 1.9999829604005483e-05, "loss": 1.5688, "step": 1165 }, { "epoch": 0.03, "learning_rate": 1.9999824401388185e-05, "loss": 1.6748, "step": 1166 }, { "epoch": 0.03, "learning_rate": 1.9999819120536962e-05, "loss": 1.6484, "step": 1167 }, { "epoch": 0.03, "learning_rate": 1.9999813761451862e-05, "loss": 1.6641, "step": 1168 }, { "epoch": 0.03, "learning_rate": 1.9999808324132915e-05, "loss": 1.5496, "step": 1169 }, { "epoch": 0.03, "learning_rate": 1.9999802808580176e-05, "loss": 1.6167, "step": 1170 }, { "epoch": 0.03, "learning_rate": 1.9999797214793677e-05, "loss": 1.6704, "step": 1171 }, { "epoch": 0.03, "learning_rate": 1.999979154277347e-05, "loss": 1.5713, "step": 1172 }, { "epoch": 0.03, "learning_rate": 1.9999785792519594e-05, "loss": 1.5596, "step": 1173 }, { "epoch": 0.03, "learning_rate": 1.9999779964032098e-05, "loss": 1.6675, "step": 1174 }, { "epoch": 0.03, "learning_rate": 1.9999774057311025e-05, "loss": 1.6218, "step": 1175 }, { "epoch": 0.03, "learning_rate": 1.999976807235642e-05, "loss": 1.6851, "step": 1176 }, { "epoch": 0.03, "learning_rate": 1.9999762009168336e-05, "loss": 1.6428, "step": 1177 }, { "epoch": 0.03, "learning_rate": 1.9999755867746814e-05, "loss": 1.7178, "step": 1178 }, { "epoch": 0.03, "learning_rate": 1.9999749648091903e-05, "loss": 1.6226, "step": 1179 }, { "epoch": 0.03, "learning_rate": 1.9999743350203656e-05, "loss": 1.7271, "step": 1180 }, { "epoch": 0.03, "learning_rate": 1.999973697408212e-05, "loss": 1.5913, "step": 1181 }, { "epoch": 0.03, "learning_rate": 1.999973051972734e-05, "loss": 1.6331, "step": 1182 }, { "epoch": 0.03, "learning_rate": 1.9999723987139373e-05, "loss": 1.7063, "step": 1183 }, { "epoch": 0.03, "learning_rate": 1.9999717376318267e-05, "loss": 1.7378, "step": 1184 }, { "epoch": 0.03, "learning_rate": 1.9999710687264073e-05, "loss": 1.9272, "step": 1185 }, { "epoch": 0.03, "learning_rate": 1.9999703919976845e-05, "loss": 1.5952, "step": 1186 }, { "epoch": 0.03, "learning_rate": 1.999969707445664e-05, "loss": 1.4478, "step": 1187 }, { "epoch": 0.03, "learning_rate": 1.9999690150703503e-05, "loss": 1.4744, "step": 1188 }, { "epoch": 0.03, "learning_rate": 1.9999683148717492e-05, "loss": 1.5334, "step": 1189 }, { "epoch": 0.03, "learning_rate": 1.9999676068498665e-05, "loss": 1.6699, "step": 1190 }, { "epoch": 0.03, "learning_rate": 1.9999668910047076e-05, "loss": 1.6638, "step": 1191 }, { "epoch": 0.03, "learning_rate": 1.9999661673362774e-05, "loss": 1.7344, "step": 1192 }, { "epoch": 0.03, "learning_rate": 1.9999654358445826e-05, "loss": 1.6665, "step": 1193 }, { "epoch": 0.03, "learning_rate": 1.9999646965296284e-05, "loss": 1.7134, "step": 1194 }, { "epoch": 0.03, "learning_rate": 1.9999639493914206e-05, "loss": 1.585, "step": 1195 }, { "epoch": 0.03, "learning_rate": 1.999963194429965e-05, "loss": 1.6248, "step": 1196 }, { "epoch": 0.03, "learning_rate": 1.9999624316452674e-05, "loss": 1.728, "step": 1197 }, { "epoch": 0.03, "learning_rate": 1.9999616610373342e-05, "loss": 1.6167, "step": 1198 }, { "epoch": 0.03, "learning_rate": 1.9999608826061712e-05, "loss": 1.6562, "step": 1199 }, { "epoch": 0.03, "learning_rate": 1.9999600963517844e-05, "loss": 1.6099, "step": 1200 }, { "epoch": 0.03, "learning_rate": 1.9999593022741796e-05, "loss": 1.6792, "step": 1201 }, { "epoch": 0.03, "learning_rate": 1.9999585003733643e-05, "loss": 1.7065, "step": 1202 }, { "epoch": 0.03, "learning_rate": 1.9999576906493432e-05, "loss": 1.6626, "step": 1203 }, { "epoch": 0.03, "learning_rate": 1.9999568731021238e-05, "loss": 1.5898, "step": 1204 }, { "epoch": 0.03, "learning_rate": 1.9999560477317118e-05, "loss": 1.6309, "step": 1205 }, { "epoch": 0.03, "learning_rate": 1.9999552145381136e-05, "loss": 1.5251, "step": 1206 }, { "epoch": 0.03, "learning_rate": 1.9999543735213365e-05, "loss": 1.6338, "step": 1207 }, { "epoch": 0.03, "learning_rate": 1.9999535246813864e-05, "loss": 1.6084, "step": 1208 }, { "epoch": 0.03, "learning_rate": 1.99995266801827e-05, "loss": 1.562, "step": 1209 }, { "epoch": 0.03, "learning_rate": 1.9999518035319942e-05, "loss": 1.7939, "step": 1210 }, { "epoch": 0.03, "learning_rate": 1.999950931222566e-05, "loss": 1.4258, "step": 1211 }, { "epoch": 0.03, "learning_rate": 1.9999500510899917e-05, "loss": 1.6338, "step": 1212 }, { "epoch": 0.03, "learning_rate": 1.9999491631342786e-05, "loss": 1.4751, "step": 1213 }, { "epoch": 0.03, "learning_rate": 1.9999482673554333e-05, "loss": 1.5703, "step": 1214 }, { "epoch": 0.03, "learning_rate": 1.9999473637534628e-05, "loss": 1.5703, "step": 1215 }, { "epoch": 0.03, "learning_rate": 1.9999464523283743e-05, "loss": 1.5459, "step": 1216 }, { "epoch": 0.03, "learning_rate": 1.9999455330801752e-05, "loss": 1.457, "step": 1217 }, { "epoch": 0.03, "learning_rate": 1.9999446060088727e-05, "loss": 1.5132, "step": 1218 }, { "epoch": 0.03, "learning_rate": 1.9999436711144734e-05, "loss": 1.6567, "step": 1219 }, { "epoch": 0.03, "learning_rate": 1.999942728396985e-05, "loss": 1.5815, "step": 1220 }, { "epoch": 0.03, "learning_rate": 1.999941777856415e-05, "loss": 1.5417, "step": 1221 }, { "epoch": 0.03, "learning_rate": 1.9999408194927708e-05, "loss": 1.6484, "step": 1222 }, { "epoch": 0.03, "learning_rate": 1.99993985330606e-05, "loss": 1.709, "step": 1223 }, { "epoch": 0.03, "learning_rate": 1.9999388792962895e-05, "loss": 1.6196, "step": 1224 }, { "epoch": 0.03, "learning_rate": 1.9999378974634676e-05, "loss": 1.8047, "step": 1225 }, { "epoch": 0.03, "learning_rate": 1.999936907807602e-05, "loss": 1.689, "step": 1226 }, { "epoch": 0.03, "learning_rate": 1.9999359103287003e-05, "loss": 1.7778, "step": 1227 }, { "epoch": 0.03, "learning_rate": 1.99993490502677e-05, "loss": 1.5596, "step": 1228 }, { "epoch": 0.03, "learning_rate": 1.9999338919018192e-05, "loss": 1.5566, "step": 1229 }, { "epoch": 0.03, "learning_rate": 1.999932870953856e-05, "loss": 1.6499, "step": 1230 }, { "epoch": 0.03, "learning_rate": 1.9999318421828882e-05, "loss": 1.5933, "step": 1231 }, { "epoch": 0.03, "learning_rate": 1.9999308055889238e-05, "loss": 1.708, "step": 1232 }, { "epoch": 0.03, "learning_rate": 1.999929761171971e-05, "loss": 1.6865, "step": 1233 }, { "epoch": 0.03, "learning_rate": 1.9999287089320378e-05, "loss": 1.532, "step": 1234 }, { "epoch": 0.03, "learning_rate": 1.9999276488691327e-05, "loss": 1.6787, "step": 1235 }, { "epoch": 0.03, "learning_rate": 1.999926580983264e-05, "loss": 1.584, "step": 1236 }, { "epoch": 0.03, "learning_rate": 1.99992550527444e-05, "loss": 1.5132, "step": 1237 }, { "epoch": 0.03, "learning_rate": 1.9999244217426687e-05, "loss": 1.4785, "step": 1238 }, { "epoch": 0.03, "learning_rate": 1.9999233303879592e-05, "loss": 1.5786, "step": 1239 }, { "epoch": 0.03, "learning_rate": 1.9999222312103194e-05, "loss": 1.5356, "step": 1240 }, { "epoch": 0.03, "learning_rate": 1.9999211242097588e-05, "loss": 1.5444, "step": 1241 }, { "epoch": 0.03, "learning_rate": 1.999920009386285e-05, "loss": 1.7568, "step": 1242 }, { "epoch": 0.03, "learning_rate": 1.9999188867399076e-05, "loss": 1.605, "step": 1243 }, { "epoch": 0.03, "learning_rate": 1.9999177562706345e-05, "loss": 1.604, "step": 1244 }, { "epoch": 0.03, "learning_rate": 1.9999166179784756e-05, "loss": 1.5247, "step": 1245 }, { "epoch": 0.03, "learning_rate": 1.999915471863439e-05, "loss": 1.7422, "step": 1246 }, { "epoch": 0.03, "learning_rate": 1.9999143179255344e-05, "loss": 1.6567, "step": 1247 }, { "epoch": 0.03, "learning_rate": 1.99991315616477e-05, "loss": 1.5732, "step": 1248 }, { "epoch": 0.03, "learning_rate": 1.999911986581155e-05, "loss": 1.4644, "step": 1249 }, { "epoch": 0.03, "learning_rate": 1.9999108091746992e-05, "loss": 1.6367, "step": 1250 }, { "epoch": 0.03, "learning_rate": 1.9999096239454116e-05, "loss": 1.6392, "step": 1251 }, { "epoch": 0.03, "learning_rate": 1.999908430893301e-05, "loss": 1.6094, "step": 1252 }, { "epoch": 0.03, "learning_rate": 1.999907230018377e-05, "loss": 1.6338, "step": 1253 }, { "epoch": 0.03, "learning_rate": 1.999906021320649e-05, "loss": 1.7119, "step": 1254 }, { "epoch": 0.03, "learning_rate": 1.9999048048001266e-05, "loss": 1.6343, "step": 1255 }, { "epoch": 0.03, "learning_rate": 1.9999035804568192e-05, "loss": 1.6797, "step": 1256 }, { "epoch": 0.03, "learning_rate": 1.9999023482907363e-05, "loss": 1.54, "step": 1257 }, { "epoch": 0.03, "learning_rate": 1.9999011083018874e-05, "loss": 1.7021, "step": 1258 }, { "epoch": 0.03, "learning_rate": 1.9998998604902827e-05, "loss": 1.5366, "step": 1259 }, { "epoch": 0.03, "learning_rate": 1.9998986048559316e-05, "loss": 1.5813, "step": 1260 }, { "epoch": 0.03, "learning_rate": 1.9998973413988443e-05, "loss": 1.5596, "step": 1261 }, { "epoch": 0.03, "learning_rate": 1.99989607011903e-05, "loss": 1.5322, "step": 1262 }, { "epoch": 0.03, "learning_rate": 1.999894791016499e-05, "loss": 1.5811, "step": 1263 }, { "epoch": 0.03, "learning_rate": 1.9998935040912618e-05, "loss": 1.7095, "step": 1264 }, { "epoch": 0.03, "learning_rate": 1.9998922093433276e-05, "loss": 1.6587, "step": 1265 }, { "epoch": 0.03, "learning_rate": 1.999890906772707e-05, "loss": 1.5928, "step": 1266 }, { "epoch": 0.03, "learning_rate": 1.99988959637941e-05, "loss": 1.6074, "step": 1267 }, { "epoch": 0.03, "learning_rate": 1.9998882781634475e-05, "loss": 1.5271, "step": 1268 }, { "epoch": 0.03, "learning_rate": 1.9998869521248288e-05, "loss": 1.5688, "step": 1269 }, { "epoch": 0.03, "learning_rate": 1.9998856182635647e-05, "loss": 1.7915, "step": 1270 }, { "epoch": 0.03, "learning_rate": 1.999884276579666e-05, "loss": 1.6165, "step": 1271 }, { "epoch": 0.03, "learning_rate": 1.9998829270731427e-05, "loss": 1.6621, "step": 1272 }, { "epoch": 0.03, "learning_rate": 1.9998815697440058e-05, "loss": 1.6113, "step": 1273 }, { "epoch": 0.03, "learning_rate": 1.9998802045922655e-05, "loss": 1.6094, "step": 1274 }, { "epoch": 0.03, "learning_rate": 1.9998788316179326e-05, "loss": 1.6934, "step": 1275 }, { "epoch": 0.03, "learning_rate": 1.999877450821018e-05, "loss": 1.6284, "step": 1276 }, { "epoch": 0.03, "learning_rate": 1.9998760622015324e-05, "loss": 1.5293, "step": 1277 }, { "epoch": 0.03, "learning_rate": 1.9998746657594867e-05, "loss": 1.647, "step": 1278 }, { "epoch": 0.03, "learning_rate": 1.9998732614948918e-05, "loss": 1.5957, "step": 1279 }, { "epoch": 0.03, "learning_rate": 1.9998718494077586e-05, "loss": 1.5767, "step": 1280 }, { "epoch": 0.03, "learning_rate": 1.9998704294980982e-05, "loss": 1.5793, "step": 1281 }, { "epoch": 0.04, "learning_rate": 1.9998690017659215e-05, "loss": 1.5161, "step": 1282 }, { "epoch": 0.04, "learning_rate": 1.9998675662112404e-05, "loss": 1.4873, "step": 1283 }, { "epoch": 0.04, "learning_rate": 1.9998661228340654e-05, "loss": 1.6904, "step": 1284 }, { "epoch": 0.04, "learning_rate": 1.999864671634408e-05, "loss": 1.626, "step": 1285 }, { "epoch": 0.04, "learning_rate": 1.9998632126122795e-05, "loss": 1.6023, "step": 1286 }, { "epoch": 0.04, "learning_rate": 1.9998617457676914e-05, "loss": 1.8848, "step": 1287 }, { "epoch": 0.04, "learning_rate": 1.9998602711006555e-05, "loss": 1.5415, "step": 1288 }, { "epoch": 0.04, "learning_rate": 1.9998587886111825e-05, "loss": 1.9199, "step": 1289 }, { "epoch": 0.04, "learning_rate": 1.999857298299285e-05, "loss": 1.6697, "step": 1290 }, { "epoch": 0.04, "learning_rate": 1.9998558001649736e-05, "loss": 1.4763, "step": 1291 }, { "epoch": 0.04, "learning_rate": 1.999854294208261e-05, "loss": 1.6294, "step": 1292 }, { "epoch": 0.04, "learning_rate": 1.9998527804291586e-05, "loss": 1.4897, "step": 1293 }, { "epoch": 0.04, "learning_rate": 1.999851258827678e-05, "loss": 1.6353, "step": 1294 }, { "epoch": 0.04, "learning_rate": 1.9998497294038316e-05, "loss": 1.6401, "step": 1295 }, { "epoch": 0.04, "learning_rate": 1.999848192157631e-05, "loss": 1.6318, "step": 1296 }, { "epoch": 0.04, "learning_rate": 1.999846647089088e-05, "loss": 1.5957, "step": 1297 }, { "epoch": 0.04, "learning_rate": 1.9998450941982154e-05, "loss": 1.6626, "step": 1298 }, { "epoch": 0.04, "learning_rate": 1.9998435334850244e-05, "loss": 1.6943, "step": 1299 }, { "epoch": 0.04, "learning_rate": 1.9998419649495286e-05, "loss": 1.5947, "step": 1300 }, { "epoch": 0.04, "learning_rate": 1.9998403885917387e-05, "loss": 1.6089, "step": 1301 }, { "epoch": 0.04, "learning_rate": 1.999838804411668e-05, "loss": 1.4641, "step": 1302 }, { "epoch": 0.04, "learning_rate": 1.9998372124093283e-05, "loss": 1.6113, "step": 1303 }, { "epoch": 0.04, "learning_rate": 1.999835612584733e-05, "loss": 1.688, "step": 1304 }, { "epoch": 0.04, "learning_rate": 1.999834004937894e-05, "loss": 1.582, "step": 1305 }, { "epoch": 0.04, "learning_rate": 1.999832389468823e-05, "loss": 1.6304, "step": 1306 }, { "epoch": 0.04, "learning_rate": 1.9998307661775346e-05, "loss": 1.7017, "step": 1307 }, { "epoch": 0.04, "learning_rate": 1.9998291350640398e-05, "loss": 1.6543, "step": 1308 }, { "epoch": 0.04, "learning_rate": 1.9998274961283523e-05, "loss": 1.5125, "step": 1309 }, { "epoch": 0.04, "learning_rate": 1.999825849370485e-05, "loss": 1.4834, "step": 1310 }, { "epoch": 0.04, "learning_rate": 1.9998241947904495e-05, "loss": 1.6812, "step": 1311 }, { "epoch": 0.04, "learning_rate": 1.9998225323882603e-05, "loss": 1.7148, "step": 1312 }, { "epoch": 0.04, "learning_rate": 1.9998208621639296e-05, "loss": 1.563, "step": 1313 }, { "epoch": 0.04, "learning_rate": 1.9998191841174705e-05, "loss": 1.6333, "step": 1314 }, { "epoch": 0.04, "learning_rate": 1.9998174982488962e-05, "loss": 1.4878, "step": 1315 }, { "epoch": 0.04, "learning_rate": 1.99981580455822e-05, "loss": 1.6416, "step": 1316 }, { "epoch": 0.04, "learning_rate": 1.999814103045455e-05, "loss": 1.5864, "step": 1317 }, { "epoch": 0.04, "learning_rate": 1.9998123937106153e-05, "loss": 1.5112, "step": 1318 }, { "epoch": 0.04, "learning_rate": 1.999810676553713e-05, "loss": 1.8999, "step": 1319 }, { "epoch": 0.04, "learning_rate": 1.9998089515747622e-05, "loss": 1.6135, "step": 1320 }, { "epoch": 0.04, "learning_rate": 1.9998072187737762e-05, "loss": 1.6367, "step": 1321 }, { "epoch": 0.04, "learning_rate": 1.9998054781507686e-05, "loss": 1.6274, "step": 1322 }, { "epoch": 0.04, "learning_rate": 1.9998037297057533e-05, "loss": 1.5898, "step": 1323 }, { "epoch": 0.04, "learning_rate": 1.9998019734387438e-05, "loss": 1.606, "step": 1324 }, { "epoch": 0.04, "learning_rate": 1.9998002093497536e-05, "loss": 1.7349, "step": 1325 }, { "epoch": 0.04, "learning_rate": 1.9997984374387967e-05, "loss": 1.5635, "step": 1326 }, { "epoch": 0.04, "learning_rate": 1.9997966577058872e-05, "loss": 1.748, "step": 1327 }, { "epoch": 0.04, "learning_rate": 1.9997948701510385e-05, "loss": 1.6904, "step": 1328 }, { "epoch": 0.04, "learning_rate": 1.999793074774265e-05, "loss": 1.6655, "step": 1329 }, { "epoch": 0.04, "learning_rate": 1.9997912715755807e-05, "loss": 1.6182, "step": 1330 }, { "epoch": 0.04, "learning_rate": 1.9997894605549994e-05, "loss": 1.7031, "step": 1331 }, { "epoch": 0.04, "learning_rate": 1.9997876417125357e-05, "loss": 1.6475, "step": 1332 }, { "epoch": 0.04, "learning_rate": 1.9997858150482036e-05, "loss": 1.7004, "step": 1333 }, { "epoch": 0.04, "learning_rate": 1.9997839805620175e-05, "loss": 1.437, "step": 1334 }, { "epoch": 0.04, "learning_rate": 1.9997821382539914e-05, "loss": 1.626, "step": 1335 }, { "epoch": 0.04, "learning_rate": 1.9997802881241402e-05, "loss": 1.625, "step": 1336 }, { "epoch": 0.04, "learning_rate": 1.9997784301724777e-05, "loss": 1.6479, "step": 1337 }, { "epoch": 0.04, "learning_rate": 1.9997765643990196e-05, "loss": 1.6694, "step": 1338 }, { "epoch": 0.04, "learning_rate": 1.9997746908037794e-05, "loss": 1.7563, "step": 1339 }, { "epoch": 0.04, "learning_rate": 1.999772809386772e-05, "loss": 1.6597, "step": 1340 }, { "epoch": 0.04, "learning_rate": 1.9997709201480127e-05, "loss": 1.4773, "step": 1341 }, { "epoch": 0.04, "learning_rate": 1.9997690230875156e-05, "loss": 1.6592, "step": 1342 }, { "epoch": 0.04, "learning_rate": 1.9997671182052958e-05, "loss": 1.4695, "step": 1343 }, { "epoch": 0.04, "learning_rate": 1.999765205501368e-05, "loss": 1.5967, "step": 1344 }, { "epoch": 0.04, "learning_rate": 1.9997632849757477e-05, "loss": 1.689, "step": 1345 }, { "epoch": 0.04, "learning_rate": 1.9997613566284496e-05, "loss": 1.717, "step": 1346 }, { "epoch": 0.04, "learning_rate": 1.9997594204594883e-05, "loss": 1.5459, "step": 1347 }, { "epoch": 0.04, "learning_rate": 1.9997574764688797e-05, "loss": 1.5552, "step": 1348 }, { "epoch": 0.04, "learning_rate": 1.999755524656639e-05, "loss": 1.5295, "step": 1349 }, { "epoch": 0.04, "learning_rate": 1.999753565022781e-05, "loss": 1.897, "step": 1350 }, { "epoch": 0.04, "learning_rate": 1.999751597567321e-05, "loss": 1.8267, "step": 1351 }, { "epoch": 0.04, "learning_rate": 1.9997496222902746e-05, "loss": 1.5566, "step": 1352 }, { "epoch": 0.04, "learning_rate": 1.999747639191658e-05, "loss": 1.5298, "step": 1353 }, { "epoch": 0.04, "learning_rate": 1.999745648271485e-05, "loss": 1.5859, "step": 1354 }, { "epoch": 0.04, "learning_rate": 1.9997436495297726e-05, "loss": 1.6895, "step": 1355 }, { "epoch": 0.04, "learning_rate": 1.999741642966536e-05, "loss": 1.4604, "step": 1356 }, { "epoch": 0.04, "learning_rate": 1.9997396285817907e-05, "loss": 1.6021, "step": 1357 }, { "epoch": 0.04, "learning_rate": 1.999737606375553e-05, "loss": 1.5679, "step": 1358 }, { "epoch": 0.04, "learning_rate": 1.9997355763478385e-05, "loss": 1.6807, "step": 1359 }, { "epoch": 0.04, "learning_rate": 1.9997335384986624e-05, "loss": 1.502, "step": 1360 }, { "epoch": 0.04, "learning_rate": 1.9997314928280413e-05, "loss": 1.6035, "step": 1361 }, { "epoch": 0.04, "learning_rate": 1.9997294393359915e-05, "loss": 1.543, "step": 1362 }, { "epoch": 0.04, "learning_rate": 1.9997273780225282e-05, "loss": 1.4636, "step": 1363 }, { "epoch": 0.04, "learning_rate": 1.9997253088876684e-05, "loss": 1.6313, "step": 1364 }, { "epoch": 0.04, "learning_rate": 1.999723231931428e-05, "loss": 1.3921, "step": 1365 }, { "epoch": 0.04, "learning_rate": 1.9997211471538226e-05, "loss": 1.7314, "step": 1366 }, { "epoch": 0.04, "learning_rate": 1.9997190545548695e-05, "loss": 1.6177, "step": 1367 }, { "epoch": 0.04, "learning_rate": 1.9997169541345842e-05, "loss": 1.5103, "step": 1368 }, { "epoch": 0.04, "learning_rate": 1.9997148458929837e-05, "loss": 1.5918, "step": 1369 }, { "epoch": 0.04, "learning_rate": 1.9997127298300846e-05, "loss": 1.5811, "step": 1370 }, { "epoch": 0.04, "learning_rate": 1.999710605945903e-05, "loss": 1.5762, "step": 1371 }, { "epoch": 0.04, "learning_rate": 1.999708474240456e-05, "loss": 1.4507, "step": 1372 }, { "epoch": 0.04, "learning_rate": 1.9997063347137596e-05, "loss": 1.5198, "step": 1373 }, { "epoch": 0.04, "learning_rate": 1.999704187365831e-05, "loss": 1.4863, "step": 1374 }, { "epoch": 0.04, "learning_rate": 1.9997020321966872e-05, "loss": 1.6177, "step": 1375 }, { "epoch": 0.04, "learning_rate": 1.9996998692063445e-05, "loss": 1.6885, "step": 1376 }, { "epoch": 0.04, "learning_rate": 1.9996976983948203e-05, "loss": 1.6025, "step": 1377 }, { "epoch": 0.04, "learning_rate": 1.9996955197621313e-05, "loss": 1.4631, "step": 1378 }, { "epoch": 0.04, "learning_rate": 1.9996933333082945e-05, "loss": 1.5054, "step": 1379 }, { "epoch": 0.04, "learning_rate": 1.9996911390333275e-05, "loss": 1.6738, "step": 1380 }, { "epoch": 0.04, "learning_rate": 1.999688936937247e-05, "loss": 1.4854, "step": 1381 }, { "epoch": 0.04, "learning_rate": 1.9996867270200703e-05, "loss": 1.6162, "step": 1382 }, { "epoch": 0.04, "learning_rate": 1.9996845092818146e-05, "loss": 1.6558, "step": 1383 }, { "epoch": 0.04, "learning_rate": 1.9996822837224975e-05, "loss": 1.6196, "step": 1384 }, { "epoch": 0.04, "learning_rate": 1.9996800503421362e-05, "loss": 1.6304, "step": 1385 }, { "epoch": 0.04, "learning_rate": 1.9996778091407484e-05, "loss": 1.8076, "step": 1386 }, { "epoch": 0.04, "learning_rate": 1.9996755601183513e-05, "loss": 1.6353, "step": 1387 }, { "epoch": 0.04, "learning_rate": 1.9996733032749633e-05, "loss": 1.4927, "step": 1388 }, { "epoch": 0.04, "learning_rate": 1.999671038610601e-05, "loss": 1.4543, "step": 1389 }, { "epoch": 0.04, "learning_rate": 1.9996687661252824e-05, "loss": 1.4783, "step": 1390 }, { "epoch": 0.04, "learning_rate": 1.9996664858190254e-05, "loss": 1.7534, "step": 1391 }, { "epoch": 0.04, "learning_rate": 1.9996641976918483e-05, "loss": 1.4927, "step": 1392 }, { "epoch": 0.04, "learning_rate": 1.9996619017437684e-05, "loss": 1.6182, "step": 1393 }, { "epoch": 0.04, "learning_rate": 1.999659597974804e-05, "loss": 1.385, "step": 1394 }, { "epoch": 0.04, "learning_rate": 1.9996572863849727e-05, "loss": 1.5737, "step": 1395 }, { "epoch": 0.04, "learning_rate": 1.9996549669742932e-05, "loss": 1.625, "step": 1396 }, { "epoch": 0.04, "learning_rate": 1.999652639742783e-05, "loss": 1.5186, "step": 1397 }, { "epoch": 0.04, "learning_rate": 1.9996503046904608e-05, "loss": 1.6157, "step": 1398 }, { "epoch": 0.04, "learning_rate": 1.9996479618173444e-05, "loss": 1.5176, "step": 1399 }, { "epoch": 0.04, "learning_rate": 1.999645611123453e-05, "loss": 1.6006, "step": 1400 }, { "epoch": 0.04, "learning_rate": 1.9996432526088038e-05, "loss": 1.5715, "step": 1401 }, { "epoch": 0.04, "learning_rate": 1.999640886273416e-05, "loss": 1.687, "step": 1402 }, { "epoch": 0.04, "learning_rate": 1.9996385121173084e-05, "loss": 1.5601, "step": 1403 }, { "epoch": 0.04, "learning_rate": 1.9996361301404986e-05, "loss": 1.7026, "step": 1404 }, { "epoch": 0.04, "learning_rate": 1.9996337403430058e-05, "loss": 1.5164, "step": 1405 }, { "epoch": 0.04, "learning_rate": 1.999631342724849e-05, "loss": 1.4062, "step": 1406 }, { "epoch": 0.04, "learning_rate": 1.9996289372860468e-05, "loss": 1.6021, "step": 1407 }, { "epoch": 0.04, "learning_rate": 1.9996265240266172e-05, "loss": 1.5122, "step": 1408 }, { "epoch": 0.04, "learning_rate": 1.9996241029465802e-05, "loss": 1.4919, "step": 1409 }, { "epoch": 0.04, "learning_rate": 1.9996216740459544e-05, "loss": 1.5283, "step": 1410 }, { "epoch": 0.04, "learning_rate": 1.9996192373247584e-05, "loss": 1.3916, "step": 1411 }, { "epoch": 0.04, "learning_rate": 1.9996167927830115e-05, "loss": 1.7202, "step": 1412 }, { "epoch": 0.04, "learning_rate": 1.999614340420733e-05, "loss": 1.6011, "step": 1413 }, { "epoch": 0.04, "learning_rate": 1.9996118802379416e-05, "loss": 1.6113, "step": 1414 }, { "epoch": 0.04, "learning_rate": 1.999609412234657e-05, "loss": 1.6406, "step": 1415 }, { "epoch": 0.04, "learning_rate": 1.999606936410899e-05, "loss": 1.6455, "step": 1416 }, { "epoch": 0.04, "learning_rate": 1.999604452766686e-05, "loss": 1.5195, "step": 1417 }, { "epoch": 0.04, "learning_rate": 1.9996019613020378e-05, "loss": 1.4946, "step": 1418 }, { "epoch": 0.04, "learning_rate": 1.9995994620169738e-05, "loss": 1.6729, "step": 1419 }, { "epoch": 0.04, "learning_rate": 1.999596954911514e-05, "loss": 1.6738, "step": 1420 }, { "epoch": 0.04, "learning_rate": 1.9995944399856773e-05, "loss": 1.7363, "step": 1421 }, { "epoch": 0.04, "learning_rate": 1.999591917239484e-05, "loss": 1.5562, "step": 1422 }, { "epoch": 0.04, "learning_rate": 1.9995893866729533e-05, "loss": 1.6436, "step": 1423 }, { "epoch": 0.04, "learning_rate": 1.9995868482861054e-05, "loss": 1.8789, "step": 1424 }, { "epoch": 0.04, "learning_rate": 1.99958430207896e-05, "loss": 1.5745, "step": 1425 }, { "epoch": 0.04, "learning_rate": 1.9995817480515373e-05, "loss": 1.7075, "step": 1426 }, { "epoch": 0.04, "learning_rate": 1.9995791862038567e-05, "loss": 1.6123, "step": 1427 }, { "epoch": 0.04, "learning_rate": 1.9995766165359388e-05, "loss": 1.3733, "step": 1428 }, { "epoch": 0.04, "learning_rate": 1.9995740390478033e-05, "loss": 1.4146, "step": 1429 }, { "epoch": 0.04, "learning_rate": 1.9995714537394708e-05, "loss": 1.5649, "step": 1430 }, { "epoch": 0.04, "learning_rate": 1.999568860610961e-05, "loss": 1.6567, "step": 1431 }, { "epoch": 0.04, "learning_rate": 1.9995662596622945e-05, "loss": 1.6089, "step": 1432 }, { "epoch": 0.04, "learning_rate": 1.999563650893492e-05, "loss": 1.7603, "step": 1433 }, { "epoch": 0.04, "learning_rate": 1.9995610343045734e-05, "loss": 1.4692, "step": 1434 }, { "epoch": 0.04, "learning_rate": 1.9995584098955588e-05, "loss": 1.7632, "step": 1435 }, { "epoch": 0.04, "learning_rate": 1.9995557776664697e-05, "loss": 1.9062, "step": 1436 }, { "epoch": 0.04, "learning_rate": 1.999553137617326e-05, "loss": 1.6675, "step": 1437 }, { "epoch": 0.04, "learning_rate": 1.9995504897481487e-05, "loss": 1.51, "step": 1438 }, { "epoch": 0.04, "learning_rate": 1.9995478340589585e-05, "loss": 1.6255, "step": 1439 }, { "epoch": 0.04, "learning_rate": 1.9995451705497758e-05, "loss": 1.5881, "step": 1440 }, { "epoch": 0.04, "learning_rate": 1.999542499220622e-05, "loss": 1.5842, "step": 1441 }, { "epoch": 0.04, "learning_rate": 1.9995398200715176e-05, "loss": 1.5962, "step": 1442 }, { "epoch": 0.04, "learning_rate": 1.9995371331024835e-05, "loss": 1.5967, "step": 1443 }, { "epoch": 0.04, "learning_rate": 1.999534438313541e-05, "loss": 1.4744, "step": 1444 }, { "epoch": 0.04, "learning_rate": 1.999531735704711e-05, "loss": 1.573, "step": 1445 }, { "epoch": 0.04, "learning_rate": 1.9995290252760148e-05, "loss": 1.5322, "step": 1446 }, { "epoch": 0.04, "learning_rate": 1.9995263070274736e-05, "loss": 1.8667, "step": 1447 }, { "epoch": 0.04, "learning_rate": 1.9995235809591086e-05, "loss": 1.4353, "step": 1448 }, { "epoch": 0.04, "learning_rate": 1.9995208470709405e-05, "loss": 1.439, "step": 1449 }, { "epoch": 0.04, "learning_rate": 1.999518105362992e-05, "loss": 1.5781, "step": 1450 }, { "epoch": 0.04, "learning_rate": 1.999515355835284e-05, "loss": 1.5669, "step": 1451 }, { "epoch": 0.04, "learning_rate": 1.999512598487837e-05, "loss": 1.458, "step": 1452 }, { "epoch": 0.04, "learning_rate": 1.999509833320674e-05, "loss": 1.5254, "step": 1453 }, { "epoch": 0.04, "learning_rate": 1.9995070603338162e-05, "loss": 1.4937, "step": 1454 }, { "epoch": 0.04, "learning_rate": 1.999504279527285e-05, "loss": 1.5869, "step": 1455 }, { "epoch": 0.04, "learning_rate": 1.999501490901102e-05, "loss": 1.5991, "step": 1456 }, { "epoch": 0.04, "learning_rate": 1.99949869445529e-05, "loss": 1.7051, "step": 1457 }, { "epoch": 0.04, "learning_rate": 1.9994958901898696e-05, "loss": 1.6719, "step": 1458 }, { "epoch": 0.04, "learning_rate": 1.9994930781048633e-05, "loss": 1.5674, "step": 1459 }, { "epoch": 0.04, "learning_rate": 1.9994902582002934e-05, "loss": 1.4028, "step": 1460 }, { "epoch": 0.04, "learning_rate": 1.999487430476182e-05, "loss": 1.6064, "step": 1461 }, { "epoch": 0.04, "learning_rate": 1.9994845949325508e-05, "loss": 1.7056, "step": 1462 }, { "epoch": 0.04, "learning_rate": 1.9994817515694218e-05, "loss": 1.6147, "step": 1463 }, { "epoch": 0.04, "learning_rate": 1.999478900386818e-05, "loss": 1.6382, "step": 1464 }, { "epoch": 0.04, "learning_rate": 1.9994760413847607e-05, "loss": 1.6631, "step": 1465 }, { "epoch": 0.04, "learning_rate": 1.9994731745632734e-05, "loss": 1.5581, "step": 1466 }, { "epoch": 0.04, "learning_rate": 1.9994702999223777e-05, "loss": 1.5, "step": 1467 }, { "epoch": 0.04, "learning_rate": 1.9994674174620964e-05, "loss": 1.6118, "step": 1468 }, { "epoch": 0.04, "learning_rate": 1.9994645271824518e-05, "loss": 1.4756, "step": 1469 }, { "epoch": 0.04, "learning_rate": 1.999461629083467e-05, "loss": 1.5862, "step": 1470 }, { "epoch": 0.04, "learning_rate": 1.9994587231651644e-05, "loss": 1.5793, "step": 1471 }, { "epoch": 0.04, "learning_rate": 1.9994558094275667e-05, "loss": 1.5422, "step": 1472 }, { "epoch": 0.04, "learning_rate": 1.9994528878706965e-05, "loss": 1.689, "step": 1473 }, { "epoch": 0.04, "learning_rate": 1.999449958494577e-05, "loss": 1.5537, "step": 1474 }, { "epoch": 0.04, "learning_rate": 1.999447021299231e-05, "loss": 1.7227, "step": 1475 }, { "epoch": 0.04, "learning_rate": 1.999444076284682e-05, "loss": 1.4299, "step": 1476 }, { "epoch": 0.04, "learning_rate": 1.9994411234509518e-05, "loss": 1.5874, "step": 1477 }, { "epoch": 0.04, "learning_rate": 1.9994381627980643e-05, "loss": 1.4971, "step": 1478 }, { "epoch": 0.04, "learning_rate": 1.999435194326043e-05, "loss": 1.3582, "step": 1479 }, { "epoch": 0.04, "learning_rate": 1.9994322180349103e-05, "loss": 1.6011, "step": 1480 }, { "epoch": 0.04, "learning_rate": 1.99942923392469e-05, "loss": 1.5432, "step": 1481 }, { "epoch": 0.04, "learning_rate": 1.9994262419954055e-05, "loss": 1.4585, "step": 1482 }, { "epoch": 0.04, "learning_rate": 1.9994232422470798e-05, "loss": 1.5991, "step": 1483 }, { "epoch": 0.04, "learning_rate": 1.999420234679737e-05, "loss": 1.5532, "step": 1484 }, { "epoch": 0.04, "learning_rate": 1.9994172192934e-05, "loss": 1.6626, "step": 1485 }, { "epoch": 0.04, "learning_rate": 1.9994141960880926e-05, "loss": 1.5381, "step": 1486 }, { "epoch": 0.04, "learning_rate": 1.9994111650638383e-05, "loss": 1.551, "step": 1487 }, { "epoch": 0.04, "learning_rate": 1.999408126220661e-05, "loss": 1.665, "step": 1488 }, { "epoch": 0.04, "learning_rate": 1.9994050795585852e-05, "loss": 1.6519, "step": 1489 }, { "epoch": 0.04, "learning_rate": 1.9994020250776335e-05, "loss": 1.5669, "step": 1490 }, { "epoch": 0.04, "learning_rate": 1.99939896277783e-05, "loss": 1.5879, "step": 1491 }, { "epoch": 0.04, "learning_rate": 1.9993958926591995e-05, "loss": 1.502, "step": 1492 }, { "epoch": 0.04, "learning_rate": 1.9993928147217652e-05, "loss": 1.3508, "step": 1493 }, { "epoch": 0.04, "learning_rate": 1.9993897289655514e-05, "loss": 1.6172, "step": 1494 }, { "epoch": 0.04, "learning_rate": 1.9993866353905824e-05, "loss": 1.5327, "step": 1495 }, { "epoch": 0.04, "learning_rate": 1.9993835339968824e-05, "loss": 1.363, "step": 1496 }, { "epoch": 0.04, "learning_rate": 1.9993804247844753e-05, "loss": 1.686, "step": 1497 }, { "epoch": 0.04, "learning_rate": 1.999377307753386e-05, "loss": 1.667, "step": 1498 }, { "epoch": 0.04, "learning_rate": 1.9993741829036387e-05, "loss": 1.6147, "step": 1499 }, { "epoch": 0.04, "learning_rate": 1.9993710502352573e-05, "loss": 1.5801, "step": 1500 }, { "epoch": 0.04, "learning_rate": 1.999367909748267e-05, "loss": 1.7646, "step": 1501 }, { "epoch": 0.04, "learning_rate": 1.9993647614426922e-05, "loss": 1.6157, "step": 1502 }, { "epoch": 0.04, "learning_rate": 1.9993616053185573e-05, "loss": 1.5034, "step": 1503 }, { "epoch": 0.04, "learning_rate": 1.999358441375887e-05, "loss": 1.625, "step": 1504 }, { "epoch": 0.04, "learning_rate": 1.9993552696147065e-05, "loss": 1.6416, "step": 1505 }, { "epoch": 0.04, "learning_rate": 1.99935209003504e-05, "loss": 1.6289, "step": 1506 }, { "epoch": 0.04, "learning_rate": 1.999348902636913e-05, "loss": 1.6206, "step": 1507 }, { "epoch": 0.04, "learning_rate": 1.9993457074203498e-05, "loss": 1.5049, "step": 1508 }, { "epoch": 0.04, "learning_rate": 1.9993425043853758e-05, "loss": 1.6523, "step": 1509 }, { "epoch": 0.04, "learning_rate": 1.9993392935320163e-05, "loss": 1.397, "step": 1510 }, { "epoch": 0.04, "learning_rate": 1.9993360748602953e-05, "loss": 1.5059, "step": 1511 }, { "epoch": 0.04, "learning_rate": 1.9993328483702393e-05, "loss": 1.5742, "step": 1512 }, { "epoch": 0.04, "learning_rate": 1.999329614061873e-05, "loss": 1.4358, "step": 1513 }, { "epoch": 0.04, "learning_rate": 1.999326371935222e-05, "loss": 1.5986, "step": 1514 }, { "epoch": 0.04, "learning_rate": 1.9993231219903108e-05, "loss": 1.3293, "step": 1515 }, { "epoch": 0.04, "learning_rate": 1.9993198642271658e-05, "loss": 1.4719, "step": 1516 }, { "epoch": 0.04, "learning_rate": 1.9993165986458122e-05, "loss": 1.6357, "step": 1517 }, { "epoch": 0.04, "learning_rate": 1.999313325246275e-05, "loss": 1.5286, "step": 1518 }, { "epoch": 0.04, "learning_rate": 1.9993100440285805e-05, "loss": 1.4717, "step": 1519 }, { "epoch": 0.04, "learning_rate": 1.9993067549927542e-05, "loss": 1.468, "step": 1520 }, { "epoch": 0.04, "learning_rate": 1.9993034581388215e-05, "loss": 1.9043, "step": 1521 }, { "epoch": 0.04, "learning_rate": 1.9993001534668087e-05, "loss": 1.5771, "step": 1522 }, { "epoch": 0.04, "learning_rate": 1.9992968409767413e-05, "loss": 1.4429, "step": 1523 }, { "epoch": 0.04, "learning_rate": 1.9992935206686453e-05, "loss": 1.6274, "step": 1524 }, { "epoch": 0.04, "learning_rate": 1.9992901925425466e-05, "loss": 1.5469, "step": 1525 }, { "epoch": 0.04, "learning_rate": 1.9992868565984717e-05, "loss": 1.519, "step": 1526 }, { "epoch": 0.04, "learning_rate": 1.999283512836446e-05, "loss": 1.6387, "step": 1527 }, { "epoch": 0.04, "learning_rate": 1.999280161256496e-05, "loss": 1.6157, "step": 1528 }, { "epoch": 0.04, "learning_rate": 1.999276801858648e-05, "loss": 1.7119, "step": 1529 }, { "epoch": 0.04, "learning_rate": 1.9992734346429285e-05, "loss": 1.5442, "step": 1530 }, { "epoch": 0.04, "learning_rate": 1.9992700596093632e-05, "loss": 1.6284, "step": 1531 }, { "epoch": 0.04, "learning_rate": 1.9992666767579786e-05, "loss": 1.6377, "step": 1532 }, { "epoch": 0.04, "learning_rate": 1.9992632860888017e-05, "loss": 1.5757, "step": 1533 }, { "epoch": 0.04, "learning_rate": 1.9992598876018588e-05, "loss": 1.6655, "step": 1534 }, { "epoch": 0.04, "learning_rate": 1.9992564812971764e-05, "loss": 1.5317, "step": 1535 }, { "epoch": 0.04, "learning_rate": 1.999253067174781e-05, "loss": 1.5308, "step": 1536 }, { "epoch": 0.04, "learning_rate": 1.9992496452346996e-05, "loss": 1.5947, "step": 1537 }, { "epoch": 0.04, "learning_rate": 1.999246215476959e-05, "loss": 1.4048, "step": 1538 }, { "epoch": 0.04, "learning_rate": 1.999242777901586e-05, "loss": 1.5195, "step": 1539 }, { "epoch": 0.04, "learning_rate": 1.9992393325086067e-05, "loss": 1.563, "step": 1540 }, { "epoch": 0.04, "learning_rate": 1.9992358792980492e-05, "loss": 1.5625, "step": 1541 }, { "epoch": 0.04, "learning_rate": 1.9992324182699403e-05, "loss": 1.645, "step": 1542 }, { "epoch": 0.04, "learning_rate": 1.9992289494243066e-05, "loss": 1.6602, "step": 1543 }, { "epoch": 0.04, "learning_rate": 1.9992254727611753e-05, "loss": 1.583, "step": 1544 }, { "epoch": 0.04, "learning_rate": 1.999221988280574e-05, "loss": 1.4583, "step": 1545 }, { "epoch": 0.04, "learning_rate": 1.9992184959825292e-05, "loss": 1.5098, "step": 1546 }, { "epoch": 0.04, "learning_rate": 1.9992149958670692e-05, "loss": 1.6904, "step": 1547 }, { "epoch": 0.04, "learning_rate": 1.999211487934221e-05, "loss": 1.5938, "step": 1548 }, { "epoch": 0.04, "learning_rate": 1.999207972184012e-05, "loss": 1.6567, "step": 1549 }, { "epoch": 0.04, "learning_rate": 1.9992044486164695e-05, "loss": 1.4717, "step": 1550 }, { "epoch": 0.04, "learning_rate": 1.9992009172316214e-05, "loss": 1.8096, "step": 1551 }, { "epoch": 0.04, "learning_rate": 1.999197378029495e-05, "loss": 1.5439, "step": 1552 }, { "epoch": 0.04, "learning_rate": 1.9991938310101186e-05, "loss": 1.6553, "step": 1553 }, { "epoch": 0.04, "learning_rate": 1.9991902761735187e-05, "loss": 1.5591, "step": 1554 }, { "epoch": 0.04, "learning_rate": 1.9991867135197247e-05, "loss": 1.5061, "step": 1555 }, { "epoch": 0.04, "learning_rate": 1.9991831430487635e-05, "loss": 1.584, "step": 1556 }, { "epoch": 0.04, "learning_rate": 1.999179564760663e-05, "loss": 1.4468, "step": 1557 }, { "epoch": 0.04, "learning_rate": 1.9991759786554515e-05, "loss": 1.5474, "step": 1558 }, { "epoch": 0.04, "learning_rate": 1.9991723847331574e-05, "loss": 1.5833, "step": 1559 }, { "epoch": 0.04, "learning_rate": 1.9991687829938082e-05, "loss": 1.6162, "step": 1560 }, { "epoch": 0.04, "learning_rate": 1.9991651734374322e-05, "loss": 1.4258, "step": 1561 }, { "epoch": 0.04, "learning_rate": 1.9991615560640575e-05, "loss": 1.6411, "step": 1562 }, { "epoch": 0.04, "learning_rate": 1.999157930873713e-05, "loss": 1.4927, "step": 1563 }, { "epoch": 0.04, "learning_rate": 1.9991542978664264e-05, "loss": 1.3994, "step": 1564 }, { "epoch": 0.04, "learning_rate": 1.9991506570422266e-05, "loss": 1.6626, "step": 1565 }, { "epoch": 0.04, "learning_rate": 1.999147008401142e-05, "loss": 1.4893, "step": 1566 }, { "epoch": 0.04, "learning_rate": 1.9991433519432008e-05, "loss": 1.6548, "step": 1567 }, { "epoch": 0.04, "learning_rate": 1.9991396876684317e-05, "loss": 1.5562, "step": 1568 }, { "epoch": 0.04, "learning_rate": 1.9991360155768638e-05, "loss": 1.6699, "step": 1569 }, { "epoch": 0.04, "learning_rate": 1.9991323356685255e-05, "loss": 1.5278, "step": 1570 }, { "epoch": 0.04, "learning_rate": 1.9991286479434456e-05, "loss": 1.6299, "step": 1571 }, { "epoch": 0.04, "learning_rate": 1.999124952401653e-05, "loss": 1.5879, "step": 1572 }, { "epoch": 0.04, "learning_rate": 1.9991212490431767e-05, "loss": 1.6353, "step": 1573 }, { "epoch": 0.04, "learning_rate": 1.9991175378680452e-05, "loss": 1.6274, "step": 1574 }, { "epoch": 0.04, "learning_rate": 1.999113818876288e-05, "loss": 1.603, "step": 1575 }, { "epoch": 0.04, "learning_rate": 1.9991100920679344e-05, "loss": 1.6392, "step": 1576 }, { "epoch": 0.04, "learning_rate": 1.999106357443013e-05, "loss": 1.7544, "step": 1577 }, { "epoch": 0.04, "learning_rate": 1.9991026150015535e-05, "loss": 1.5952, "step": 1578 }, { "epoch": 0.04, "learning_rate": 1.9990988647435846e-05, "loss": 1.5718, "step": 1579 }, { "epoch": 0.04, "learning_rate": 1.9990951066691364e-05, "loss": 1.6035, "step": 1580 }, { "epoch": 0.04, "learning_rate": 1.9990913407782377e-05, "loss": 1.5288, "step": 1581 }, { "epoch": 0.04, "learning_rate": 1.9990875670709182e-05, "loss": 1.6328, "step": 1582 }, { "epoch": 0.04, "learning_rate": 1.999083785547207e-05, "loss": 1.6919, "step": 1583 }, { "epoch": 0.04, "learning_rate": 1.9990799962071347e-05, "loss": 1.6011, "step": 1584 }, { "epoch": 0.04, "learning_rate": 1.99907619905073e-05, "loss": 1.5566, "step": 1585 }, { "epoch": 0.04, "learning_rate": 1.9990723940780227e-05, "loss": 1.8735, "step": 1586 }, { "epoch": 0.04, "learning_rate": 1.9990685812890432e-05, "loss": 1.645, "step": 1587 }, { "epoch": 0.04, "learning_rate": 1.999064760683821e-05, "loss": 1.4863, "step": 1588 }, { "epoch": 0.04, "learning_rate": 1.9990609322623854e-05, "loss": 1.8906, "step": 1589 }, { "epoch": 0.04, "learning_rate": 1.9990570960247672e-05, "loss": 1.4597, "step": 1590 }, { "epoch": 0.04, "learning_rate": 1.999053251970996e-05, "loss": 1.5454, "step": 1591 }, { "epoch": 0.04, "learning_rate": 1.9990494001011017e-05, "loss": 1.405, "step": 1592 }, { "epoch": 0.04, "learning_rate": 1.9990455404151147e-05, "loss": 1.6084, "step": 1593 }, { "epoch": 0.04, "learning_rate": 1.9990416729130655e-05, "loss": 1.4727, "step": 1594 }, { "epoch": 0.04, "learning_rate": 1.999037797594984e-05, "loss": 1.6516, "step": 1595 }, { "epoch": 0.04, "learning_rate": 1.9990339144609003e-05, "loss": 1.5667, "step": 1596 }, { "epoch": 0.04, "learning_rate": 1.9990300235108452e-05, "loss": 1.531, "step": 1597 }, { "epoch": 0.04, "learning_rate": 1.999026124744849e-05, "loss": 1.6257, "step": 1598 }, { "epoch": 0.04, "learning_rate": 1.999022218162942e-05, "loss": 1.5183, "step": 1599 }, { "epoch": 0.04, "learning_rate": 1.999018303765155e-05, "loss": 1.5725, "step": 1600 }, { "epoch": 0.04, "learning_rate": 1.9990143815515188e-05, "loss": 1.5337, "step": 1601 }, { "epoch": 0.04, "learning_rate": 1.9990104515220636e-05, "loss": 1.5325, "step": 1602 }, { "epoch": 0.04, "learning_rate": 1.9990065136768206e-05, "loss": 1.564, "step": 1603 }, { "epoch": 0.04, "learning_rate": 1.9990025680158202e-05, "loss": 1.5554, "step": 1604 }, { "epoch": 0.04, "learning_rate": 1.9989986145390934e-05, "loss": 1.5181, "step": 1605 }, { "epoch": 0.04, "learning_rate": 1.9989946532466712e-05, "loss": 1.6719, "step": 1606 }, { "epoch": 0.04, "learning_rate": 1.9989906841385853e-05, "loss": 1.5566, "step": 1607 }, { "epoch": 0.04, "learning_rate": 1.998986707214865e-05, "loss": 1.6143, "step": 1608 }, { "epoch": 0.04, "learning_rate": 1.998982722475543e-05, "loss": 1.4678, "step": 1609 }, { "epoch": 0.04, "learning_rate": 1.99897872992065e-05, "loss": 1.4749, "step": 1610 }, { "epoch": 0.04, "learning_rate": 1.998974729550217e-05, "loss": 1.3701, "step": 1611 }, { "epoch": 0.04, "learning_rate": 1.9989707213642755e-05, "loss": 1.6802, "step": 1612 }, { "epoch": 0.04, "learning_rate": 1.998966705362857e-05, "loss": 1.4319, "step": 1613 }, { "epoch": 0.04, "learning_rate": 1.9989626815459923e-05, "loss": 1.646, "step": 1614 }, { "epoch": 0.04, "learning_rate": 1.9989586499137137e-05, "loss": 1.4473, "step": 1615 }, { "epoch": 0.04, "learning_rate": 1.9989546104660524e-05, "loss": 1.4612, "step": 1616 }, { "epoch": 0.04, "learning_rate": 1.9989505632030397e-05, "loss": 1.5942, "step": 1617 }, { "epoch": 0.04, "learning_rate": 1.998946508124708e-05, "loss": 1.708, "step": 1618 }, { "epoch": 0.04, "learning_rate": 1.998942445231088e-05, "loss": 1.5571, "step": 1619 }, { "epoch": 0.04, "learning_rate": 1.998938374522212e-05, "loss": 1.6079, "step": 1620 }, { "epoch": 0.04, "learning_rate": 1.9989342959981125e-05, "loss": 1.7388, "step": 1621 }, { "epoch": 0.04, "learning_rate": 1.9989302096588204e-05, "loss": 1.9067, "step": 1622 }, { "epoch": 0.04, "learning_rate": 1.998926115504368e-05, "loss": 1.6016, "step": 1623 }, { "epoch": 0.04, "learning_rate": 1.9989220135347875e-05, "loss": 1.509, "step": 1624 }, { "epoch": 0.04, "learning_rate": 1.998917903750111e-05, "loss": 1.7017, "step": 1625 }, { "epoch": 0.04, "learning_rate": 1.9989137861503708e-05, "loss": 1.5322, "step": 1626 }, { "epoch": 0.04, "learning_rate": 1.9989096607355983e-05, "loss": 1.6509, "step": 1627 }, { "epoch": 0.04, "learning_rate": 1.9989055275058264e-05, "loss": 1.4099, "step": 1628 }, { "epoch": 0.04, "learning_rate": 1.9989013864610877e-05, "loss": 1.6929, "step": 1629 }, { "epoch": 0.04, "learning_rate": 1.9988972376014142e-05, "loss": 1.8823, "step": 1630 }, { "epoch": 0.04, "learning_rate": 1.998893080926838e-05, "loss": 1.4517, "step": 1631 }, { "epoch": 0.04, "learning_rate": 1.9988889164373927e-05, "loss": 1.5708, "step": 1632 }, { "epoch": 0.04, "learning_rate": 1.9988847441331097e-05, "loss": 1.5884, "step": 1633 }, { "epoch": 0.04, "learning_rate": 1.9988805640140225e-05, "loss": 1.5859, "step": 1634 }, { "epoch": 0.04, "learning_rate": 1.9988763760801632e-05, "loss": 1.623, "step": 1635 }, { "epoch": 0.04, "learning_rate": 1.998872180331565e-05, "loss": 1.5298, "step": 1636 }, { "epoch": 0.04, "learning_rate": 1.998867976768261e-05, "loss": 1.4944, "step": 1637 }, { "epoch": 0.04, "learning_rate": 1.998863765390283e-05, "loss": 1.5811, "step": 1638 }, { "epoch": 0.04, "learning_rate": 1.998859546197665e-05, "loss": 1.5129, "step": 1639 }, { "epoch": 0.04, "learning_rate": 1.9988553191904393e-05, "loss": 1.4062, "step": 1640 }, { "epoch": 0.04, "learning_rate": 1.9988510843686392e-05, "loss": 1.8286, "step": 1641 }, { "epoch": 0.04, "learning_rate": 1.998846841732298e-05, "loss": 1.6572, "step": 1642 }, { "epoch": 0.04, "learning_rate": 1.998842591281449e-05, "loss": 1.5845, "step": 1643 }, { "epoch": 0.04, "learning_rate": 1.9988383330161252e-05, "loss": 1.6672, "step": 1644 }, { "epoch": 0.04, "learning_rate": 1.9988340669363598e-05, "loss": 1.4268, "step": 1645 }, { "epoch": 0.04, "learning_rate": 1.9988297930421865e-05, "loss": 1.4751, "step": 1646 }, { "epoch": 0.04, "learning_rate": 1.9988255113336386e-05, "loss": 1.6182, "step": 1647 }, { "epoch": 0.05, "learning_rate": 1.9988212218107496e-05, "loss": 1.6108, "step": 1648 }, { "epoch": 0.05, "learning_rate": 1.998816924473553e-05, "loss": 1.5771, "step": 1649 }, { "epoch": 0.05, "learning_rate": 1.9988126193220826e-05, "loss": 1.4338, "step": 1650 }, { "epoch": 0.05, "learning_rate": 1.9988083063563713e-05, "loss": 1.7012, "step": 1651 }, { "epoch": 0.05, "learning_rate": 1.998803985576454e-05, "loss": 1.7119, "step": 1652 }, { "epoch": 0.05, "learning_rate": 1.9987996569823643e-05, "loss": 1.5337, "step": 1653 }, { "epoch": 0.05, "learning_rate": 1.9987953205741352e-05, "loss": 1.5884, "step": 1654 }, { "epoch": 0.05, "learning_rate": 1.9987909763518013e-05, "loss": 1.3074, "step": 1655 }, { "epoch": 0.05, "learning_rate": 1.998786624315397e-05, "loss": 1.627, "step": 1656 }, { "epoch": 0.05, "learning_rate": 1.998782264464955e-05, "loss": 1.511, "step": 1657 }, { "epoch": 0.05, "learning_rate": 1.9987778968005107e-05, "loss": 1.5481, "step": 1658 }, { "epoch": 0.05, "learning_rate": 1.9987735213220975e-05, "loss": 1.5981, "step": 1659 }, { "epoch": 0.05, "learning_rate": 1.9987691380297502e-05, "loss": 1.5962, "step": 1660 }, { "epoch": 0.05, "learning_rate": 1.9987647469235026e-05, "loss": 1.5513, "step": 1661 }, { "epoch": 0.05, "learning_rate": 1.9987603480033896e-05, "loss": 1.6582, "step": 1662 }, { "epoch": 0.05, "learning_rate": 1.998755941269445e-05, "loss": 1.6401, "step": 1663 }, { "epoch": 0.05, "learning_rate": 1.9987515267217037e-05, "loss": 1.5127, "step": 1664 }, { "epoch": 0.05, "learning_rate": 1.9987471043602e-05, "loss": 1.5398, "step": 1665 }, { "epoch": 0.05, "learning_rate": 1.9987426741849686e-05, "loss": 1.4683, "step": 1666 }, { "epoch": 0.05, "learning_rate": 1.998738236196044e-05, "loss": 1.5896, "step": 1667 }, { "epoch": 0.05, "learning_rate": 1.9987337903934617e-05, "loss": 1.4351, "step": 1668 }, { "epoch": 0.05, "learning_rate": 1.9987293367772553e-05, "loss": 1.5518, "step": 1669 }, { "epoch": 0.05, "learning_rate": 1.9987248753474603e-05, "loss": 1.6948, "step": 1670 }, { "epoch": 0.05, "learning_rate": 1.9987204061041116e-05, "loss": 1.6821, "step": 1671 }, { "epoch": 0.05, "learning_rate": 1.998715929047244e-05, "loss": 1.5066, "step": 1672 }, { "epoch": 0.05, "learning_rate": 1.9987114441768928e-05, "loss": 1.553, "step": 1673 }, { "epoch": 0.05, "learning_rate": 1.9987069514930925e-05, "loss": 1.4387, "step": 1674 }, { "epoch": 0.05, "learning_rate": 1.9987024509958787e-05, "loss": 1.4492, "step": 1675 }, { "epoch": 0.05, "learning_rate": 1.9986979426852868e-05, "loss": 1.5566, "step": 1676 }, { "epoch": 0.05, "learning_rate": 1.9986934265613516e-05, "loss": 1.5996, "step": 1677 }, { "epoch": 0.05, "learning_rate": 1.998688902624109e-05, "loss": 1.5327, "step": 1678 }, { "epoch": 0.05, "learning_rate": 1.9986843708735937e-05, "loss": 1.5493, "step": 1679 }, { "epoch": 0.05, "learning_rate": 1.9986798313098415e-05, "loss": 1.4929, "step": 1680 }, { "epoch": 0.05, "learning_rate": 1.9986752839328883e-05, "loss": 1.543, "step": 1681 }, { "epoch": 0.05, "learning_rate": 1.998670728742769e-05, "loss": 1.4067, "step": 1682 }, { "epoch": 0.05, "learning_rate": 1.9986661657395196e-05, "loss": 1.5718, "step": 1683 }, { "epoch": 0.05, "learning_rate": 1.9986615949231755e-05, "loss": 1.4539, "step": 1684 }, { "epoch": 0.05, "learning_rate": 1.998657016293773e-05, "loss": 1.5952, "step": 1685 }, { "epoch": 0.05, "learning_rate": 1.9986524298513474e-05, "loss": 1.6172, "step": 1686 }, { "epoch": 0.05, "learning_rate": 1.9986478355959347e-05, "loss": 1.6255, "step": 1687 }, { "epoch": 0.05, "learning_rate": 1.998643233527571e-05, "loss": 1.4502, "step": 1688 }, { "epoch": 0.05, "learning_rate": 1.9986386236462926e-05, "loss": 1.6636, "step": 1689 }, { "epoch": 0.05, "learning_rate": 1.998634005952135e-05, "loss": 1.5884, "step": 1690 }, { "epoch": 0.05, "learning_rate": 1.998629380445134e-05, "loss": 1.3357, "step": 1691 }, { "epoch": 0.05, "learning_rate": 1.998624747125327e-05, "loss": 1.5645, "step": 1692 }, { "epoch": 0.05, "learning_rate": 1.998620105992749e-05, "loss": 1.4216, "step": 1693 }, { "epoch": 0.05, "learning_rate": 1.9986154570474375e-05, "loss": 1.6111, "step": 1694 }, { "epoch": 0.05, "learning_rate": 1.998610800289428e-05, "loss": 1.5977, "step": 1695 }, { "epoch": 0.05, "learning_rate": 1.9986061357187568e-05, "loss": 1.5308, "step": 1696 }, { "epoch": 0.05, "learning_rate": 1.9986014633354612e-05, "loss": 1.6099, "step": 1697 }, { "epoch": 0.05, "learning_rate": 1.9985967831395775e-05, "loss": 1.5361, "step": 1698 }, { "epoch": 0.05, "learning_rate": 1.9985920951311417e-05, "loss": 1.6479, "step": 1699 }, { "epoch": 0.05, "learning_rate": 1.998587399310191e-05, "loss": 1.3652, "step": 1700 }, { "epoch": 0.05, "learning_rate": 1.998582695676762e-05, "loss": 1.55, "step": 1701 }, { "epoch": 0.05, "learning_rate": 1.9985779842308916e-05, "loss": 1.6133, "step": 1702 }, { "epoch": 0.05, "learning_rate": 1.9985732649726168e-05, "loss": 1.5046, "step": 1703 }, { "epoch": 0.05, "learning_rate": 1.9985685379019742e-05, "loss": 1.8188, "step": 1704 }, { "epoch": 0.05, "learning_rate": 1.998563803019001e-05, "loss": 1.5947, "step": 1705 }, { "epoch": 0.05, "learning_rate": 1.9985590603237342e-05, "loss": 1.5835, "step": 1706 }, { "epoch": 0.05, "learning_rate": 1.9985543098162107e-05, "loss": 1.4653, "step": 1707 }, { "epoch": 0.05, "learning_rate": 1.9985495514964678e-05, "loss": 1.4827, "step": 1708 }, { "epoch": 0.05, "learning_rate": 1.998544785364543e-05, "loss": 1.4775, "step": 1709 }, { "epoch": 0.05, "learning_rate": 1.9985400114204734e-05, "loss": 1.5491, "step": 1710 }, { "epoch": 0.05, "learning_rate": 1.998535229664296e-05, "loss": 1.5017, "step": 1711 }, { "epoch": 0.05, "learning_rate": 1.998530440096049e-05, "loss": 1.5391, "step": 1712 }, { "epoch": 0.05, "learning_rate": 1.9985256427157688e-05, "loss": 1.5732, "step": 1713 }, { "epoch": 0.05, "learning_rate": 1.9985208375234933e-05, "loss": 1.5894, "step": 1714 }, { "epoch": 0.05, "learning_rate": 1.998516024519261e-05, "loss": 1.4758, "step": 1715 }, { "epoch": 0.05, "learning_rate": 1.9985112037031087e-05, "loss": 1.8154, "step": 1716 }, { "epoch": 0.05, "learning_rate": 1.998506375075074e-05, "loss": 1.5461, "step": 1717 }, { "epoch": 0.05, "learning_rate": 1.9985015386351955e-05, "loss": 1.5962, "step": 1718 }, { "epoch": 0.05, "learning_rate": 1.9984966943835098e-05, "loss": 1.5505, "step": 1719 }, { "epoch": 0.05, "learning_rate": 1.9984918423200556e-05, "loss": 1.5308, "step": 1720 }, { "epoch": 0.05, "learning_rate": 1.9984869824448712e-05, "loss": 1.501, "step": 1721 }, { "epoch": 0.05, "learning_rate": 1.998482114757994e-05, "loss": 1.6548, "step": 1722 }, { "epoch": 0.05, "learning_rate": 1.998477239259462e-05, "loss": 1.4509, "step": 1723 }, { "epoch": 0.05, "learning_rate": 1.9984723559493137e-05, "loss": 1.5188, "step": 1724 }, { "epoch": 0.05, "learning_rate": 1.9984674648275874e-05, "loss": 1.7134, "step": 1725 }, { "epoch": 0.05, "learning_rate": 1.998462565894321e-05, "loss": 1.7944, "step": 1726 }, { "epoch": 0.05, "learning_rate": 1.998457659149553e-05, "loss": 1.7402, "step": 1727 }, { "epoch": 0.05, "learning_rate": 1.9984527445933216e-05, "loss": 1.6724, "step": 1728 }, { "epoch": 0.05, "learning_rate": 1.998447822225666e-05, "loss": 1.6294, "step": 1729 }, { "epoch": 0.05, "learning_rate": 1.9984428920466236e-05, "loss": 1.563, "step": 1730 }, { "epoch": 0.05, "learning_rate": 1.9984379540562336e-05, "loss": 1.4685, "step": 1731 }, { "epoch": 0.05, "learning_rate": 1.998433008254535e-05, "loss": 1.7544, "step": 1732 }, { "epoch": 0.05, "learning_rate": 1.9984280546415655e-05, "loss": 1.5398, "step": 1733 }, { "epoch": 0.05, "learning_rate": 1.9984230932173646e-05, "loss": 1.687, "step": 1734 }, { "epoch": 0.05, "learning_rate": 1.998418123981971e-05, "loss": 1.5347, "step": 1735 }, { "epoch": 0.05, "learning_rate": 1.9984131469354233e-05, "loss": 1.4883, "step": 1736 }, { "epoch": 0.05, "learning_rate": 1.9984081620777608e-05, "loss": 1.4309, "step": 1737 }, { "epoch": 0.05, "learning_rate": 1.9984031694090224e-05, "loss": 1.5522, "step": 1738 }, { "epoch": 0.05, "learning_rate": 1.9983981689292466e-05, "loss": 1.4756, "step": 1739 }, { "epoch": 0.05, "learning_rate": 1.9983931606384736e-05, "loss": 1.5967, "step": 1740 }, { "epoch": 0.05, "learning_rate": 1.9983881445367415e-05, "loss": 1.5303, "step": 1741 }, { "epoch": 0.05, "learning_rate": 1.99838312062409e-05, "loss": 1.5864, "step": 1742 }, { "epoch": 0.05, "learning_rate": 1.998378088900559e-05, "loss": 1.6196, "step": 1743 }, { "epoch": 0.05, "learning_rate": 1.998373049366187e-05, "loss": 1.5752, "step": 1744 }, { "epoch": 0.05, "learning_rate": 1.9983680020210133e-05, "loss": 1.6055, "step": 1745 }, { "epoch": 0.05, "learning_rate": 1.9983629468650786e-05, "loss": 1.5254, "step": 1746 }, { "epoch": 0.05, "learning_rate": 1.9983578838984213e-05, "loss": 1.6226, "step": 1747 }, { "epoch": 0.05, "learning_rate": 1.9983528131210814e-05, "loss": 1.3474, "step": 1748 }, { "epoch": 0.05, "learning_rate": 1.9983477345330985e-05, "loss": 1.6279, "step": 1749 }, { "epoch": 0.05, "learning_rate": 1.998342648134512e-05, "loss": 1.627, "step": 1750 }, { "epoch": 0.05, "learning_rate": 1.9983375539253627e-05, "loss": 1.533, "step": 1751 }, { "epoch": 0.05, "learning_rate": 1.9983324519056895e-05, "loss": 1.5029, "step": 1752 }, { "epoch": 0.05, "learning_rate": 1.9983273420755328e-05, "loss": 1.5684, "step": 1753 }, { "epoch": 0.05, "learning_rate": 1.9983222244349326e-05, "loss": 1.4634, "step": 1754 }, { "epoch": 0.05, "learning_rate": 1.9983170989839284e-05, "loss": 1.6016, "step": 1755 }, { "epoch": 0.05, "learning_rate": 1.9983119657225607e-05, "loss": 1.5767, "step": 1756 }, { "epoch": 0.05, "learning_rate": 1.99830682465087e-05, "loss": 1.6338, "step": 1757 }, { "epoch": 0.05, "learning_rate": 1.9983016757688954e-05, "loss": 1.5171, "step": 1758 }, { "epoch": 0.05, "learning_rate": 1.9982965190766784e-05, "loss": 1.5762, "step": 1759 }, { "epoch": 0.05, "learning_rate": 1.998291354574259e-05, "loss": 1.6631, "step": 1760 }, { "epoch": 0.05, "learning_rate": 1.9982861822616773e-05, "loss": 1.5742, "step": 1761 }, { "epoch": 0.05, "learning_rate": 1.998281002138974e-05, "loss": 1.5645, "step": 1762 }, { "epoch": 0.05, "learning_rate": 1.9982758142061892e-05, "loss": 1.6118, "step": 1763 }, { "epoch": 0.05, "learning_rate": 1.9982706184633644e-05, "loss": 1.3606, "step": 1764 }, { "epoch": 0.05, "learning_rate": 1.9982654149105393e-05, "loss": 1.522, "step": 1765 }, { "epoch": 0.05, "learning_rate": 1.9982602035477554e-05, "loss": 1.5701, "step": 1766 }, { "epoch": 0.05, "learning_rate": 1.998254984375053e-05, "loss": 1.5432, "step": 1767 }, { "epoch": 0.05, "learning_rate": 1.998249757392473e-05, "loss": 1.6003, "step": 1768 }, { "epoch": 0.05, "learning_rate": 1.998244522600056e-05, "loss": 1.4016, "step": 1769 }, { "epoch": 0.05, "learning_rate": 1.9982392799978432e-05, "loss": 1.4302, "step": 1770 }, { "epoch": 0.05, "learning_rate": 1.9982340295858762e-05, "loss": 1.4893, "step": 1771 }, { "epoch": 0.05, "learning_rate": 1.998228771364195e-05, "loss": 1.4731, "step": 1772 }, { "epoch": 0.05, "learning_rate": 1.9982235053328417e-05, "loss": 1.4341, "step": 1773 }, { "epoch": 0.05, "learning_rate": 1.998218231491857e-05, "loss": 1.5166, "step": 1774 }, { "epoch": 0.05, "learning_rate": 1.9982129498412823e-05, "loss": 1.5286, "step": 1775 }, { "epoch": 0.05, "learning_rate": 1.9982076603811588e-05, "loss": 1.5527, "step": 1776 }, { "epoch": 0.05, "learning_rate": 1.9982023631115276e-05, "loss": 1.5234, "step": 1777 }, { "epoch": 0.05, "learning_rate": 1.998197058032431e-05, "loss": 1.4929, "step": 1778 }, { "epoch": 0.05, "learning_rate": 1.99819174514391e-05, "loss": 1.4885, "step": 1779 }, { "epoch": 0.05, "learning_rate": 1.9981864244460062e-05, "loss": 1.6482, "step": 1780 }, { "epoch": 0.05, "learning_rate": 1.998181095938761e-05, "loss": 1.5271, "step": 1781 }, { "epoch": 0.05, "learning_rate": 1.998175759622216e-05, "loss": 1.6245, "step": 1782 }, { "epoch": 0.05, "learning_rate": 1.9981704154964135e-05, "loss": 1.9185, "step": 1783 }, { "epoch": 0.05, "learning_rate": 1.9981650635613953e-05, "loss": 1.4922, "step": 1784 }, { "epoch": 0.05, "learning_rate": 1.9981597038172028e-05, "loss": 1.5889, "step": 1785 }, { "epoch": 0.05, "learning_rate": 1.998154336263878e-05, "loss": 1.6643, "step": 1786 }, { "epoch": 0.05, "learning_rate": 1.998148960901463e-05, "loss": 1.5974, "step": 1787 }, { "epoch": 0.05, "learning_rate": 1.99814357773e-05, "loss": 1.519, "step": 1788 }, { "epoch": 0.05, "learning_rate": 1.998138186749531e-05, "loss": 1.4575, "step": 1789 }, { "epoch": 0.05, "learning_rate": 1.9981327879600983e-05, "loss": 1.76, "step": 1790 }, { "epoch": 0.05, "learning_rate": 1.998127381361744e-05, "loss": 1.4927, "step": 1791 }, { "epoch": 0.05, "learning_rate": 1.9981219669545108e-05, "loss": 1.4983, "step": 1792 }, { "epoch": 0.05, "learning_rate": 1.9981165447384397e-05, "loss": 1.4609, "step": 1793 }, { "epoch": 0.05, "learning_rate": 1.998111114713575e-05, "loss": 1.5854, "step": 1794 }, { "epoch": 0.05, "learning_rate": 1.998105676879958e-05, "loss": 1.5146, "step": 1795 }, { "epoch": 0.05, "learning_rate": 1.9981002312376314e-05, "loss": 1.5332, "step": 1796 }, { "epoch": 0.05, "learning_rate": 1.998094777786638e-05, "loss": 1.6165, "step": 1797 }, { "epoch": 0.05, "learning_rate": 1.9980893165270207e-05, "loss": 1.4775, "step": 1798 }, { "epoch": 0.05, "learning_rate": 1.9980838474588214e-05, "loss": 1.6445, "step": 1799 }, { "epoch": 0.05, "learning_rate": 1.9980783705820836e-05, "loss": 1.6362, "step": 1800 }, { "epoch": 0.05, "learning_rate": 1.99807288589685e-05, "loss": 1.7886, "step": 1801 }, { "epoch": 0.05, "learning_rate": 1.9980673934031633e-05, "loss": 1.7173, "step": 1802 }, { "epoch": 0.05, "learning_rate": 1.998061893101067e-05, "loss": 1.6309, "step": 1803 }, { "epoch": 0.05, "learning_rate": 1.9980563849906037e-05, "loss": 1.4868, "step": 1804 }, { "epoch": 0.05, "learning_rate": 1.9980508690718165e-05, "loss": 1.3945, "step": 1805 }, { "epoch": 0.05, "learning_rate": 1.9980453453447485e-05, "loss": 1.5542, "step": 1806 }, { "epoch": 0.05, "learning_rate": 1.998039813809443e-05, "loss": 1.8521, "step": 1807 }, { "epoch": 0.05, "learning_rate": 1.9980342744659435e-05, "loss": 1.4851, "step": 1808 }, { "epoch": 0.05, "learning_rate": 1.9980287273142928e-05, "loss": 1.729, "step": 1809 }, { "epoch": 0.05, "learning_rate": 1.998023172354535e-05, "loss": 1.5596, "step": 1810 }, { "epoch": 0.05, "learning_rate": 1.998017609586713e-05, "loss": 1.5601, "step": 1811 }, { "epoch": 0.05, "learning_rate": 1.9980120390108705e-05, "loss": 1.5225, "step": 1812 }, { "epoch": 0.05, "learning_rate": 1.9980064606270514e-05, "loss": 1.5498, "step": 1813 }, { "epoch": 0.05, "learning_rate": 1.9980008744352988e-05, "loss": 1.6821, "step": 1814 }, { "epoch": 0.05, "learning_rate": 1.9979952804356565e-05, "loss": 1.572, "step": 1815 }, { "epoch": 0.05, "learning_rate": 1.997989678628169e-05, "loss": 1.4583, "step": 1816 }, { "epoch": 0.05, "learning_rate": 1.997984069012879e-05, "loss": 1.376, "step": 1817 }, { "epoch": 0.05, "learning_rate": 1.9979784515898313e-05, "loss": 1.4485, "step": 1818 }, { "epoch": 0.05, "learning_rate": 1.997972826359069e-05, "loss": 1.4231, "step": 1819 }, { "epoch": 0.05, "learning_rate": 1.997967193320637e-05, "loss": 1.604, "step": 1820 }, { "epoch": 0.05, "learning_rate": 1.9979615524745786e-05, "loss": 1.4614, "step": 1821 }, { "epoch": 0.05, "learning_rate": 1.9979559038209387e-05, "loss": 1.5352, "step": 1822 }, { "epoch": 0.05, "learning_rate": 1.9979502473597608e-05, "loss": 1.4834, "step": 1823 }, { "epoch": 0.05, "learning_rate": 1.99794458309109e-05, "loss": 1.4685, "step": 1824 }, { "epoch": 0.05, "learning_rate": 1.9979389110149693e-05, "loss": 1.4429, "step": 1825 }, { "epoch": 0.05, "learning_rate": 1.9979332311314442e-05, "loss": 1.4475, "step": 1826 }, { "epoch": 0.05, "learning_rate": 1.9979275434405586e-05, "loss": 1.6836, "step": 1827 }, { "epoch": 0.05, "learning_rate": 1.997921847942357e-05, "loss": 1.6523, "step": 1828 }, { "epoch": 0.05, "learning_rate": 1.9979161446368843e-05, "loss": 1.5322, "step": 1829 }, { "epoch": 0.05, "learning_rate": 1.997910433524185e-05, "loss": 1.5054, "step": 1830 }, { "epoch": 0.05, "learning_rate": 1.9979047146043037e-05, "loss": 1.6758, "step": 1831 }, { "epoch": 0.05, "learning_rate": 1.9978989878772854e-05, "loss": 1.5127, "step": 1832 }, { "epoch": 0.05, "learning_rate": 1.997893253343174e-05, "loss": 1.3948, "step": 1833 }, { "epoch": 0.05, "learning_rate": 1.997887511002016e-05, "loss": 1.4731, "step": 1834 }, { "epoch": 0.05, "learning_rate": 1.9978817608538545e-05, "loss": 1.5205, "step": 1835 }, { "epoch": 0.05, "learning_rate": 1.9978760028987358e-05, "loss": 1.5183, "step": 1836 }, { "epoch": 0.05, "learning_rate": 1.997870237136704e-05, "loss": 1.5967, "step": 1837 }, { "epoch": 0.05, "learning_rate": 1.997864463567805e-05, "loss": 1.5435, "step": 1838 }, { "epoch": 0.05, "learning_rate": 1.9978586821920837e-05, "loss": 1.8086, "step": 1839 }, { "epoch": 0.05, "learning_rate": 1.9978528930095856e-05, "loss": 1.5979, "step": 1840 }, { "epoch": 0.05, "learning_rate": 1.9978470960203552e-05, "loss": 1.6323, "step": 1841 }, { "epoch": 0.05, "learning_rate": 1.9978412912244385e-05, "loss": 1.5952, "step": 1842 }, { "epoch": 0.05, "learning_rate": 1.9978354786218807e-05, "loss": 1.6338, "step": 1843 }, { "epoch": 0.05, "learning_rate": 1.9978296582127273e-05, "loss": 1.501, "step": 1844 }, { "epoch": 0.05, "learning_rate": 1.9978238299970242e-05, "loss": 1.4675, "step": 1845 }, { "epoch": 0.05, "learning_rate": 1.9978179939748164e-05, "loss": 1.5815, "step": 1846 }, { "epoch": 0.05, "learning_rate": 1.9978121501461498e-05, "loss": 1.4307, "step": 1847 }, { "epoch": 0.05, "learning_rate": 1.9978062985110702e-05, "loss": 1.5083, "step": 1848 }, { "epoch": 0.05, "learning_rate": 1.9978004390696232e-05, "loss": 1.6792, "step": 1849 }, { "epoch": 0.05, "learning_rate": 1.997794571821855e-05, "loss": 1.6055, "step": 1850 }, { "epoch": 0.05, "learning_rate": 1.9977886967678112e-05, "loss": 1.5737, "step": 1851 }, { "epoch": 0.05, "learning_rate": 1.9977828139075377e-05, "loss": 1.5493, "step": 1852 }, { "epoch": 0.05, "learning_rate": 1.9977769232410806e-05, "loss": 1.5659, "step": 1853 }, { "epoch": 0.05, "learning_rate": 1.9977710247684862e-05, "loss": 1.4873, "step": 1854 }, { "epoch": 0.05, "learning_rate": 1.9977651184898005e-05, "loss": 1.3098, "step": 1855 }, { "epoch": 0.05, "learning_rate": 1.99775920440507e-05, "loss": 1.5234, "step": 1856 }, { "epoch": 0.05, "learning_rate": 1.99775328251434e-05, "loss": 1.6182, "step": 1857 }, { "epoch": 0.05, "learning_rate": 1.997747352817658e-05, "loss": 1.5576, "step": 1858 }, { "epoch": 0.05, "learning_rate": 1.9977414153150697e-05, "loss": 1.582, "step": 1859 }, { "epoch": 0.05, "learning_rate": 1.9977354700066216e-05, "loss": 1.5303, "step": 1860 }, { "epoch": 0.05, "learning_rate": 1.9977295168923603e-05, "loss": 1.4897, "step": 1861 }, { "epoch": 0.05, "learning_rate": 1.9977235559723327e-05, "loss": 1.7065, "step": 1862 }, { "epoch": 0.05, "learning_rate": 1.997717587246585e-05, "loss": 1.623, "step": 1863 }, { "epoch": 0.05, "learning_rate": 1.9977116107151642e-05, "loss": 1.5898, "step": 1864 }, { "epoch": 0.05, "learning_rate": 1.997705626378117e-05, "loss": 1.541, "step": 1865 }, { "epoch": 0.05, "learning_rate": 1.99769963423549e-05, "loss": 1.418, "step": 1866 }, { "epoch": 0.05, "learning_rate": 1.99769363428733e-05, "loss": 1.4644, "step": 1867 }, { "epoch": 0.05, "learning_rate": 1.9976876265336845e-05, "loss": 1.5249, "step": 1868 }, { "epoch": 0.05, "learning_rate": 1.9976816109746e-05, "loss": 1.8496, "step": 1869 }, { "epoch": 0.05, "learning_rate": 1.9976755876101236e-05, "loss": 1.5825, "step": 1870 }, { "epoch": 0.05, "learning_rate": 1.9976695564403024e-05, "loss": 1.5488, "step": 1871 }, { "epoch": 0.05, "learning_rate": 1.9976635174651845e-05, "loss": 1.8276, "step": 1872 }, { "epoch": 0.05, "learning_rate": 1.9976574706848154e-05, "loss": 1.6387, "step": 1873 }, { "epoch": 0.05, "learning_rate": 1.997651416099244e-05, "loss": 1.5688, "step": 1874 }, { "epoch": 0.05, "learning_rate": 1.997645353708517e-05, "loss": 1.4482, "step": 1875 }, { "epoch": 0.05, "learning_rate": 1.9976392835126817e-05, "loss": 1.5996, "step": 1876 }, { "epoch": 0.05, "learning_rate": 1.9976332055117858e-05, "loss": 1.5952, "step": 1877 }, { "epoch": 0.05, "learning_rate": 1.997627119705877e-05, "loss": 1.8057, "step": 1878 }, { "epoch": 0.05, "learning_rate": 1.9976210260950025e-05, "loss": 1.564, "step": 1879 }, { "epoch": 0.05, "learning_rate": 1.9976149246792103e-05, "loss": 1.5691, "step": 1880 }, { "epoch": 0.05, "learning_rate": 1.997608815458548e-05, "loss": 1.458, "step": 1881 }, { "epoch": 0.05, "learning_rate": 1.9976026984330633e-05, "loss": 1.5098, "step": 1882 }, { "epoch": 0.05, "learning_rate": 1.9975965736028047e-05, "loss": 1.6899, "step": 1883 }, { "epoch": 0.05, "learning_rate": 1.9975904409678192e-05, "loss": 1.3894, "step": 1884 }, { "epoch": 0.05, "learning_rate": 1.9975843005281552e-05, "loss": 1.5479, "step": 1885 }, { "epoch": 0.05, "learning_rate": 1.9975781522838606e-05, "loss": 1.564, "step": 1886 }, { "epoch": 0.05, "learning_rate": 1.997571996234984e-05, "loss": 1.708, "step": 1887 }, { "epoch": 0.05, "learning_rate": 1.997565832381573e-05, "loss": 1.5337, "step": 1888 }, { "epoch": 0.05, "learning_rate": 1.997559660723676e-05, "loss": 1.5391, "step": 1889 }, { "epoch": 0.05, "learning_rate": 1.9975534812613416e-05, "loss": 1.5691, "step": 1890 }, { "epoch": 0.05, "learning_rate": 1.9975472939946172e-05, "loss": 1.2803, "step": 1891 }, { "epoch": 0.05, "learning_rate": 1.9975410989235524e-05, "loss": 1.3704, "step": 1892 }, { "epoch": 0.05, "learning_rate": 1.9975348960481948e-05, "loss": 1.5206, "step": 1893 }, { "epoch": 0.05, "learning_rate": 1.9975286853685937e-05, "loss": 1.5576, "step": 1894 }, { "epoch": 0.05, "learning_rate": 1.9975224668847966e-05, "loss": 1.5112, "step": 1895 }, { "epoch": 0.05, "learning_rate": 1.9975162405968534e-05, "loss": 1.5942, "step": 1896 }, { "epoch": 0.05, "learning_rate": 1.997510006504812e-05, "loss": 1.5166, "step": 1897 }, { "epoch": 0.05, "learning_rate": 1.997503764608721e-05, "loss": 1.3428, "step": 1898 }, { "epoch": 0.05, "learning_rate": 1.9974975149086302e-05, "loss": 1.5906, "step": 1899 }, { "epoch": 0.05, "learning_rate": 1.9974912574045874e-05, "loss": 1.574, "step": 1900 }, { "epoch": 0.05, "learning_rate": 1.9974849920966423e-05, "loss": 1.5991, "step": 1901 }, { "epoch": 0.05, "learning_rate": 1.9974787189848434e-05, "loss": 1.4756, "step": 1902 }, { "epoch": 0.05, "learning_rate": 1.9974724380692405e-05, "loss": 1.5674, "step": 1903 }, { "epoch": 0.05, "learning_rate": 1.997466149349882e-05, "loss": 1.5522, "step": 1904 }, { "epoch": 0.05, "learning_rate": 1.9974598528268176e-05, "loss": 1.491, "step": 1905 }, { "epoch": 0.05, "learning_rate": 1.997453548500096e-05, "loss": 1.5498, "step": 1906 }, { "epoch": 0.05, "learning_rate": 1.9974472363697672e-05, "loss": 1.5557, "step": 1907 }, { "epoch": 0.05, "learning_rate": 1.9974409164358803e-05, "loss": 1.6177, "step": 1908 }, { "epoch": 0.05, "learning_rate": 1.9974345886984844e-05, "loss": 1.6772, "step": 1909 }, { "epoch": 0.05, "learning_rate": 1.9974282531576296e-05, "loss": 1.9443, "step": 1910 }, { "epoch": 0.05, "learning_rate": 1.997421909813365e-05, "loss": 1.7441, "step": 1911 }, { "epoch": 0.05, "learning_rate": 1.99741555866574e-05, "loss": 1.52, "step": 1912 }, { "epoch": 0.05, "learning_rate": 1.9974091997148054e-05, "loss": 1.5972, "step": 1913 }, { "epoch": 0.05, "learning_rate": 1.9974028329606096e-05, "loss": 1.4946, "step": 1914 }, { "epoch": 0.05, "learning_rate": 1.9973964584032036e-05, "loss": 1.5164, "step": 1915 }, { "epoch": 0.05, "learning_rate": 1.9973900760426365e-05, "loss": 1.6938, "step": 1916 }, { "epoch": 0.05, "learning_rate": 1.9973836858789585e-05, "loss": 1.6841, "step": 1917 }, { "epoch": 0.05, "learning_rate": 1.9973772879122193e-05, "loss": 1.5479, "step": 1918 }, { "epoch": 0.05, "learning_rate": 1.9973708821424695e-05, "loss": 1.5298, "step": 1919 }, { "epoch": 0.05, "learning_rate": 1.9973644685697587e-05, "loss": 1.5244, "step": 1920 }, { "epoch": 0.05, "learning_rate": 1.9973580471941374e-05, "loss": 1.5767, "step": 1921 }, { "epoch": 0.05, "learning_rate": 1.9973516180156557e-05, "loss": 1.5002, "step": 1922 }, { "epoch": 0.05, "learning_rate": 1.997345181034364e-05, "loss": 1.5916, "step": 1923 }, { "epoch": 0.05, "learning_rate": 1.9973387362503124e-05, "loss": 1.4578, "step": 1924 }, { "epoch": 0.05, "learning_rate": 1.9973322836635517e-05, "loss": 1.5576, "step": 1925 }, { "epoch": 0.05, "learning_rate": 1.9973258232741322e-05, "loss": 1.4824, "step": 1926 }, { "epoch": 0.05, "learning_rate": 1.9973193550821044e-05, "loss": 1.5591, "step": 1927 }, { "epoch": 0.05, "learning_rate": 1.9973128790875188e-05, "loss": 1.6213, "step": 1928 }, { "epoch": 0.05, "learning_rate": 1.9973063952904265e-05, "loss": 1.6089, "step": 1929 }, { "epoch": 0.05, "learning_rate": 1.9972999036908777e-05, "loss": 1.373, "step": 1930 }, { "epoch": 0.05, "learning_rate": 1.9972934042889235e-05, "loss": 1.5649, "step": 1931 }, { "epoch": 0.05, "learning_rate": 1.9972868970846147e-05, "loss": 1.6875, "step": 1932 }, { "epoch": 0.05, "learning_rate": 1.997280382078002e-05, "loss": 1.395, "step": 1933 }, { "epoch": 0.05, "learning_rate": 1.997273859269137e-05, "loss": 1.5415, "step": 1934 }, { "epoch": 0.05, "learning_rate": 1.9972673286580698e-05, "loss": 1.6287, "step": 1935 }, { "epoch": 0.05, "learning_rate": 1.9972607902448518e-05, "loss": 1.6033, "step": 1936 }, { "epoch": 0.05, "learning_rate": 1.997254244029535e-05, "loss": 1.5327, "step": 1937 }, { "epoch": 0.05, "learning_rate": 1.9972476900121693e-05, "loss": 1.542, "step": 1938 }, { "epoch": 0.05, "learning_rate": 1.9972411281928068e-05, "loss": 1.4561, "step": 1939 }, { "epoch": 0.05, "learning_rate": 1.9972345585714987e-05, "loss": 1.583, "step": 1940 }, { "epoch": 0.05, "learning_rate": 1.9972279811482965e-05, "loss": 1.5571, "step": 1941 }, { "epoch": 0.05, "learning_rate": 1.9972213959232514e-05, "loss": 1.3665, "step": 1942 }, { "epoch": 0.05, "learning_rate": 1.997214802896415e-05, "loss": 1.626, "step": 1943 }, { "epoch": 0.05, "learning_rate": 1.9972082020678387e-05, "loss": 1.5869, "step": 1944 }, { "epoch": 0.05, "learning_rate": 1.9972015934375745e-05, "loss": 1.4358, "step": 1945 }, { "epoch": 0.05, "learning_rate": 1.997194977005674e-05, "loss": 1.7769, "step": 1946 }, { "epoch": 0.05, "learning_rate": 1.997188352772189e-05, "loss": 1.5942, "step": 1947 }, { "epoch": 0.05, "learning_rate": 1.997181720737171e-05, "loss": 1.4373, "step": 1948 }, { "epoch": 0.05, "learning_rate": 1.9971750809006725e-05, "loss": 1.6948, "step": 1949 }, { "epoch": 0.05, "learning_rate": 1.9971684332627446e-05, "loss": 1.4565, "step": 1950 }, { "epoch": 0.05, "learning_rate": 1.9971617778234404e-05, "loss": 1.6479, "step": 1951 }, { "epoch": 0.05, "learning_rate": 1.997155114582811e-05, "loss": 1.5366, "step": 1952 }, { "epoch": 0.05, "learning_rate": 1.9971484435409087e-05, "loss": 1.626, "step": 1953 }, { "epoch": 0.05, "learning_rate": 1.9971417646977856e-05, "loss": 1.5825, "step": 1954 }, { "epoch": 0.05, "learning_rate": 1.9971350780534952e-05, "loss": 1.5796, "step": 1955 }, { "epoch": 0.05, "learning_rate": 1.997128383608088e-05, "loss": 1.5981, "step": 1956 }, { "epoch": 0.05, "learning_rate": 1.9971216813616176e-05, "loss": 1.5984, "step": 1957 }, { "epoch": 0.05, "learning_rate": 1.9971149713141358e-05, "loss": 1.5413, "step": 1958 }, { "epoch": 0.05, "learning_rate": 1.9971082534656958e-05, "loss": 1.5042, "step": 1959 }, { "epoch": 0.05, "learning_rate": 1.997101527816349e-05, "loss": 1.3928, "step": 1960 }, { "epoch": 0.05, "learning_rate": 1.997094794366149e-05, "loss": 1.4451, "step": 1961 }, { "epoch": 0.05, "learning_rate": 1.9970880531151485e-05, "loss": 1.3706, "step": 1962 }, { "epoch": 0.05, "learning_rate": 1.9970813040633998e-05, "loss": 1.5674, "step": 1963 }, { "epoch": 0.05, "learning_rate": 1.9970745472109553e-05, "loss": 1.5645, "step": 1964 }, { "epoch": 0.05, "learning_rate": 1.997067782557869e-05, "loss": 1.7095, "step": 1965 }, { "epoch": 0.05, "learning_rate": 1.9970610101041932e-05, "loss": 1.4175, "step": 1966 }, { "epoch": 0.05, "learning_rate": 1.9970542298499807e-05, "loss": 1.4888, "step": 1967 }, { "epoch": 0.05, "learning_rate": 1.9970474417952846e-05, "loss": 1.5454, "step": 1968 }, { "epoch": 0.05, "learning_rate": 1.9970406459401584e-05, "loss": 1.5293, "step": 1969 }, { "epoch": 0.05, "learning_rate": 1.9970338422846553e-05, "loss": 1.5151, "step": 1970 }, { "epoch": 0.05, "learning_rate": 1.997027030828828e-05, "loss": 1.5181, "step": 1971 }, { "epoch": 0.05, "learning_rate": 1.9970202115727302e-05, "loss": 1.3792, "step": 1972 }, { "epoch": 0.05, "learning_rate": 1.997013384516415e-05, "loss": 1.6292, "step": 1973 }, { "epoch": 0.05, "learning_rate": 1.9970065496599355e-05, "loss": 1.5913, "step": 1974 }, { "epoch": 0.05, "learning_rate": 1.996999707003346e-05, "loss": 1.5327, "step": 1975 }, { "epoch": 0.05, "learning_rate": 1.9969928565466995e-05, "loss": 1.4016, "step": 1976 }, { "epoch": 0.05, "learning_rate": 1.99698599829005e-05, "loss": 1.5945, "step": 1977 }, { "epoch": 0.05, "learning_rate": 1.9969791322334504e-05, "loss": 1.4365, "step": 1978 }, { "epoch": 0.05, "learning_rate": 1.996972258376955e-05, "loss": 1.5234, "step": 1979 }, { "epoch": 0.05, "learning_rate": 1.9969653767206175e-05, "loss": 1.376, "step": 1980 }, { "epoch": 0.05, "learning_rate": 1.996958487264492e-05, "loss": 1.5112, "step": 1981 }, { "epoch": 0.05, "learning_rate": 1.9969515900086317e-05, "loss": 1.4641, "step": 1982 }, { "epoch": 0.05, "learning_rate": 1.996944684953091e-05, "loss": 1.6172, "step": 1983 }, { "epoch": 0.05, "learning_rate": 1.9969377720979238e-05, "loss": 1.4956, "step": 1984 }, { "epoch": 0.05, "learning_rate": 1.9969308514431848e-05, "loss": 1.5073, "step": 1985 }, { "epoch": 0.05, "learning_rate": 1.996923922988927e-05, "loss": 1.5823, "step": 1986 }, { "epoch": 0.05, "learning_rate": 1.9969169867352055e-05, "loss": 1.5718, "step": 1987 }, { "epoch": 0.05, "learning_rate": 1.996910042682074e-05, "loss": 1.5884, "step": 1988 }, { "epoch": 0.05, "learning_rate": 1.9969030908295876e-05, "loss": 1.6553, "step": 1989 }, { "epoch": 0.05, "learning_rate": 1.9968961311778003e-05, "loss": 1.5806, "step": 1990 }, { "epoch": 0.05, "learning_rate": 1.996889163726766e-05, "loss": 1.5022, "step": 1991 }, { "epoch": 0.05, "learning_rate": 1.9968821884765397e-05, "loss": 1.5552, "step": 1992 }, { "epoch": 0.05, "learning_rate": 1.996875205427176e-05, "loss": 1.6797, "step": 1993 }, { "epoch": 0.05, "learning_rate": 1.9968682145787294e-05, "loss": 1.4978, "step": 1994 }, { "epoch": 0.05, "learning_rate": 1.9968612159312545e-05, "loss": 1.541, "step": 1995 }, { "epoch": 0.05, "learning_rate": 1.9968542094848065e-05, "loss": 1.399, "step": 1996 }, { "epoch": 0.05, "learning_rate": 1.9968471952394397e-05, "loss": 1.5376, "step": 1997 }, { "epoch": 0.05, "learning_rate": 1.9968401731952093e-05, "loss": 1.4335, "step": 1998 }, { "epoch": 0.05, "learning_rate": 1.9968331433521703e-05, "loss": 1.5359, "step": 1999 }, { "epoch": 0.05, "learning_rate": 1.9968261057103773e-05, "loss": 1.5708, "step": 2000 }, { "epoch": 0.05, "learning_rate": 1.9968190602698856e-05, "loss": 1.5815, "step": 2001 }, { "epoch": 0.05, "learning_rate": 1.9968120070307503e-05, "loss": 1.6318, "step": 2002 }, { "epoch": 0.05, "learning_rate": 1.9968049459930268e-05, "loss": 1.4526, "step": 2003 }, { "epoch": 0.05, "learning_rate": 1.99679787715677e-05, "loss": 1.4482, "step": 2004 }, { "epoch": 0.05, "learning_rate": 1.996790800522035e-05, "loss": 1.3645, "step": 2005 }, { "epoch": 0.05, "learning_rate": 1.996783716088878e-05, "loss": 1.5811, "step": 2006 }, { "epoch": 0.05, "learning_rate": 1.9967766238573537e-05, "loss": 1.8076, "step": 2007 }, { "epoch": 0.05, "learning_rate": 1.996769523827518e-05, "loss": 1.5425, "step": 2008 }, { "epoch": 0.05, "learning_rate": 1.9967624159994262e-05, "loss": 1.5549, "step": 2009 }, { "epoch": 0.05, "learning_rate": 1.9967553003731336e-05, "loss": 1.4736, "step": 2010 }, { "epoch": 0.05, "learning_rate": 1.9967481769486965e-05, "loss": 1.4585, "step": 2011 }, { "epoch": 0.05, "learning_rate": 1.9967410457261706e-05, "loss": 1.6138, "step": 2012 }, { "epoch": 0.05, "learning_rate": 1.996733906705611e-05, "loss": 1.564, "step": 2013 }, { "epoch": 0.06, "learning_rate": 1.9967267598870743e-05, "loss": 1.2927, "step": 2014 }, { "epoch": 0.06, "learning_rate": 1.996719605270616e-05, "loss": 1.4819, "step": 2015 }, { "epoch": 0.06, "learning_rate": 1.9967124428562923e-05, "loss": 1.6587, "step": 2016 }, { "epoch": 0.06, "learning_rate": 1.9967052726441594e-05, "loss": 1.645, "step": 2017 }, { "epoch": 0.06, "learning_rate": 1.9966980946342728e-05, "loss": 1.4595, "step": 2018 }, { "epoch": 0.06, "learning_rate": 1.996690908826689e-05, "loss": 1.4932, "step": 2019 }, { "epoch": 0.06, "learning_rate": 1.996683715221464e-05, "loss": 1.5581, "step": 2020 }, { "epoch": 0.06, "learning_rate": 1.996676513818655e-05, "loss": 1.4741, "step": 2021 }, { "epoch": 0.06, "learning_rate": 1.9966693046183168e-05, "loss": 1.5229, "step": 2022 }, { "epoch": 0.06, "learning_rate": 1.9966620876205068e-05, "loss": 1.728, "step": 2023 }, { "epoch": 0.06, "learning_rate": 1.9966548628252815e-05, "loss": 1.4668, "step": 2024 }, { "epoch": 0.06, "learning_rate": 1.9966476302326974e-05, "loss": 1.4736, "step": 2025 }, { "epoch": 0.06, "learning_rate": 1.9966403898428105e-05, "loss": 1.4956, "step": 2026 }, { "epoch": 0.06, "learning_rate": 1.996633141655678e-05, "loss": 1.5679, "step": 2027 }, { "epoch": 0.06, "learning_rate": 1.996625885671357e-05, "loss": 1.5669, "step": 2028 }, { "epoch": 0.06, "learning_rate": 1.9966186218899027e-05, "loss": 1.6123, "step": 2029 }, { "epoch": 0.06, "learning_rate": 1.9966113503113736e-05, "loss": 1.5723, "step": 2030 }, { "epoch": 0.06, "learning_rate": 1.9966040709358256e-05, "loss": 1.5146, "step": 2031 }, { "epoch": 0.06, "learning_rate": 1.9965967837633163e-05, "loss": 1.5112, "step": 2032 }, { "epoch": 0.06, "learning_rate": 1.9965894887939023e-05, "loss": 1.4507, "step": 2033 }, { "epoch": 0.06, "learning_rate": 1.9965821860276408e-05, "loss": 1.5991, "step": 2034 }, { "epoch": 0.06, "learning_rate": 1.9965748754645887e-05, "loss": 1.4175, "step": 2035 }, { "epoch": 0.06, "learning_rate": 1.9965675571048037e-05, "loss": 1.5032, "step": 2036 }, { "epoch": 0.06, "learning_rate": 1.9965602309483423e-05, "loss": 1.4707, "step": 2037 }, { "epoch": 0.06, "learning_rate": 1.9965528969952624e-05, "loss": 1.5732, "step": 2038 }, { "epoch": 0.06, "learning_rate": 1.9965455552456214e-05, "loss": 1.7275, "step": 2039 }, { "epoch": 0.06, "learning_rate": 1.9965382056994768e-05, "loss": 1.5601, "step": 2040 }, { "epoch": 0.06, "learning_rate": 1.9965308483568855e-05, "loss": 1.5581, "step": 2041 }, { "epoch": 0.06, "learning_rate": 1.9965234832179055e-05, "loss": 1.5251, "step": 2042 }, { "epoch": 0.06, "learning_rate": 1.9965161102825944e-05, "loss": 1.4668, "step": 2043 }, { "epoch": 0.06, "learning_rate": 1.99650872955101e-05, "loss": 1.5386, "step": 2044 }, { "epoch": 0.06, "learning_rate": 1.99650134102321e-05, "loss": 1.5151, "step": 2045 }, { "epoch": 0.06, "learning_rate": 1.996493944699252e-05, "loss": 1.6572, "step": 2046 }, { "epoch": 0.06, "learning_rate": 1.9964865405791937e-05, "loss": 1.5554, "step": 2047 }, { "epoch": 0.06, "learning_rate": 1.9964791286630933e-05, "loss": 1.6631, "step": 2048 }, { "epoch": 0.06, "learning_rate": 1.996471708951009e-05, "loss": 1.5933, "step": 2049 }, { "epoch": 0.06, "learning_rate": 1.9964642814429985e-05, "loss": 1.6367, "step": 2050 }, { "epoch": 0.06, "learning_rate": 1.99645684613912e-05, "loss": 1.5017, "step": 2051 }, { "epoch": 0.06, "learning_rate": 1.996449403039432e-05, "loss": 1.4885, "step": 2052 }, { "epoch": 0.06, "learning_rate": 1.9964419521439923e-05, "loss": 1.8506, "step": 2053 }, { "epoch": 0.06, "learning_rate": 1.996434493452859e-05, "loss": 1.5322, "step": 2054 }, { "epoch": 0.06, "learning_rate": 1.996427026966091e-05, "loss": 1.5601, "step": 2055 }, { "epoch": 0.06, "learning_rate": 1.9964195526837465e-05, "loss": 1.4873, "step": 2056 }, { "epoch": 0.06, "learning_rate": 1.996412070605884e-05, "loss": 1.4282, "step": 2057 }, { "epoch": 0.06, "learning_rate": 1.9964045807325622e-05, "loss": 1.5708, "step": 2058 }, { "epoch": 0.06, "learning_rate": 1.996397083063839e-05, "loss": 1.5083, "step": 2059 }, { "epoch": 0.06, "learning_rate": 1.9963895775997742e-05, "loss": 1.6128, "step": 2060 }, { "epoch": 0.06, "learning_rate": 1.9963820643404253e-05, "loss": 1.8169, "step": 2061 }, { "epoch": 0.06, "learning_rate": 1.996374543285852e-05, "loss": 1.5737, "step": 2062 }, { "epoch": 0.06, "learning_rate": 1.9963670144361128e-05, "loss": 1.3765, "step": 2063 }, { "epoch": 0.06, "learning_rate": 1.9963594777912663e-05, "loss": 1.4619, "step": 2064 }, { "epoch": 0.06, "learning_rate": 1.9963519333513722e-05, "loss": 1.4919, "step": 2065 }, { "epoch": 0.06, "learning_rate": 1.9963443811164887e-05, "loss": 1.4282, "step": 2066 }, { "epoch": 0.06, "learning_rate": 1.9963368210866753e-05, "loss": 1.6953, "step": 2067 }, { "epoch": 0.06, "learning_rate": 1.9963292532619915e-05, "loss": 1.5112, "step": 2068 }, { "epoch": 0.06, "learning_rate": 1.9963216776424958e-05, "loss": 1.5918, "step": 2069 }, { "epoch": 0.06, "learning_rate": 1.9963140942282478e-05, "loss": 1.6382, "step": 2070 }, { "epoch": 0.06, "learning_rate": 1.996306503019307e-05, "loss": 1.5356, "step": 2071 }, { "epoch": 0.06, "learning_rate": 1.9962989040157326e-05, "loss": 1.5259, "step": 2072 }, { "epoch": 0.06, "learning_rate": 1.996291297217584e-05, "loss": 1.5928, "step": 2073 }, { "epoch": 0.06, "learning_rate": 1.9962836826249205e-05, "loss": 1.585, "step": 2074 }, { "epoch": 0.06, "learning_rate": 1.9962760602378023e-05, "loss": 1.5327, "step": 2075 }, { "epoch": 0.06, "learning_rate": 1.9962684300562886e-05, "loss": 1.7197, "step": 2076 }, { "epoch": 0.06, "learning_rate": 1.996260792080439e-05, "loss": 1.4839, "step": 2077 }, { "epoch": 0.06, "learning_rate": 1.996253146310314e-05, "loss": 1.3652, "step": 2078 }, { "epoch": 0.06, "learning_rate": 1.9962454927459723e-05, "loss": 1.6602, "step": 2079 }, { "epoch": 0.06, "learning_rate": 1.9962378313874744e-05, "loss": 1.5391, "step": 2080 }, { "epoch": 0.06, "learning_rate": 1.9962301622348804e-05, "loss": 1.4146, "step": 2081 }, { "epoch": 0.06, "learning_rate": 1.99622248528825e-05, "loss": 1.4695, "step": 2082 }, { "epoch": 0.06, "learning_rate": 1.9962148005476432e-05, "loss": 1.4834, "step": 2083 }, { "epoch": 0.06, "learning_rate": 1.9962071080131205e-05, "loss": 1.4861, "step": 2084 }, { "epoch": 0.06, "learning_rate": 1.9961994076847416e-05, "loss": 1.4788, "step": 2085 }, { "epoch": 0.06, "learning_rate": 1.996191699562567e-05, "loss": 1.5107, "step": 2086 }, { "epoch": 0.06, "learning_rate": 1.996183983646657e-05, "loss": 1.6182, "step": 2087 }, { "epoch": 0.06, "learning_rate": 1.996176259937072e-05, "loss": 1.4961, "step": 2088 }, { "epoch": 0.06, "learning_rate": 1.9961685284338723e-05, "loss": 1.731, "step": 2089 }, { "epoch": 0.06, "learning_rate": 1.9961607891371186e-05, "loss": 1.7612, "step": 2090 }, { "epoch": 0.06, "learning_rate": 1.9961530420468714e-05, "loss": 1.5098, "step": 2091 }, { "epoch": 0.06, "learning_rate": 1.996145287163191e-05, "loss": 1.5962, "step": 2092 }, { "epoch": 0.06, "learning_rate": 1.9961375244861382e-05, "loss": 1.5566, "step": 2093 }, { "epoch": 0.06, "learning_rate": 1.9961297540157742e-05, "loss": 1.4812, "step": 2094 }, { "epoch": 0.06, "learning_rate": 1.9961219757521592e-05, "loss": 1.6304, "step": 2095 }, { "epoch": 0.06, "learning_rate": 1.9961141896953542e-05, "loss": 1.6348, "step": 2096 }, { "epoch": 0.06, "learning_rate": 1.9961063958454202e-05, "loss": 1.5928, "step": 2097 }, { "epoch": 0.06, "learning_rate": 1.9960985942024185e-05, "loss": 1.501, "step": 2098 }, { "epoch": 0.06, "learning_rate": 1.9960907847664095e-05, "loss": 1.5039, "step": 2099 }, { "epoch": 0.06, "learning_rate": 1.9960829675374548e-05, "loss": 1.645, "step": 2100 }, { "epoch": 0.06, "learning_rate": 1.996075142515615e-05, "loss": 1.6768, "step": 2101 }, { "epoch": 0.06, "learning_rate": 1.9960673097009518e-05, "loss": 1.2664, "step": 2102 }, { "epoch": 0.06, "learning_rate": 1.996059469093526e-05, "loss": 1.4387, "step": 2103 }, { "epoch": 0.06, "learning_rate": 1.9960516206933998e-05, "loss": 1.6394, "step": 2104 }, { "epoch": 0.06, "learning_rate": 1.9960437645006344e-05, "loss": 1.5684, "step": 2105 }, { "epoch": 0.06, "learning_rate": 1.9960359005152905e-05, "loss": 1.5508, "step": 2106 }, { "epoch": 0.06, "learning_rate": 1.99602802873743e-05, "loss": 1.6187, "step": 2107 }, { "epoch": 0.06, "learning_rate": 1.996020149167115e-05, "loss": 1.5605, "step": 2108 }, { "epoch": 0.06, "learning_rate": 1.9960122618044064e-05, "loss": 1.5955, "step": 2109 }, { "epoch": 0.06, "learning_rate": 1.9960043666493658e-05, "loss": 1.7056, "step": 2110 }, { "epoch": 0.06, "learning_rate": 1.995996463702056e-05, "loss": 1.5859, "step": 2111 }, { "epoch": 0.06, "learning_rate": 1.995988552962538e-05, "loss": 1.6133, "step": 2112 }, { "epoch": 0.06, "learning_rate": 1.995980634430874e-05, "loss": 1.5449, "step": 2113 }, { "epoch": 0.06, "learning_rate": 1.995972708107126e-05, "loss": 1.6069, "step": 2114 }, { "epoch": 0.06, "learning_rate": 1.9959647739913555e-05, "loss": 1.5215, "step": 2115 }, { "epoch": 0.06, "learning_rate": 1.995956832083625e-05, "loss": 1.626, "step": 2116 }, { "epoch": 0.06, "learning_rate": 1.995948882383997e-05, "loss": 1.5864, "step": 2117 }, { "epoch": 0.06, "learning_rate": 1.9959409248925326e-05, "loss": 1.4844, "step": 2118 }, { "epoch": 0.06, "learning_rate": 1.9959329596092955e-05, "loss": 1.4778, "step": 2119 }, { "epoch": 0.06, "learning_rate": 1.9959249865343466e-05, "loss": 1.4465, "step": 2120 }, { "epoch": 0.06, "learning_rate": 1.9959170056677493e-05, "loss": 1.7681, "step": 2121 }, { "epoch": 0.06, "learning_rate": 1.9959090170095653e-05, "loss": 1.5103, "step": 2122 }, { "epoch": 0.06, "learning_rate": 1.995901020559858e-05, "loss": 1.7812, "step": 2123 }, { "epoch": 0.06, "learning_rate": 1.995893016318689e-05, "loss": 1.5708, "step": 2124 }, { "epoch": 0.06, "learning_rate": 1.9958850042861212e-05, "loss": 1.5461, "step": 2125 }, { "epoch": 0.06, "learning_rate": 1.9958769844622178e-05, "loss": 1.4707, "step": 2126 }, { "epoch": 0.06, "learning_rate": 1.995868956847041e-05, "loss": 1.5972, "step": 2127 }, { "epoch": 0.06, "learning_rate": 1.995860921440654e-05, "loss": 1.8867, "step": 2128 }, { "epoch": 0.06, "learning_rate": 1.9958528782431193e-05, "loss": 1.6392, "step": 2129 }, { "epoch": 0.06, "learning_rate": 1.9958448272544997e-05, "loss": 1.4851, "step": 2130 }, { "epoch": 0.06, "learning_rate": 1.995836768474859e-05, "loss": 1.5381, "step": 2131 }, { "epoch": 0.06, "learning_rate": 1.995828701904259e-05, "loss": 1.5474, "step": 2132 }, { "epoch": 0.06, "learning_rate": 1.995820627542764e-05, "loss": 1.4539, "step": 2133 }, { "epoch": 0.06, "learning_rate": 1.9958125453904363e-05, "loss": 1.5449, "step": 2134 }, { "epoch": 0.06, "learning_rate": 1.99580445544734e-05, "loss": 1.5149, "step": 2135 }, { "epoch": 0.06, "learning_rate": 1.995796357713538e-05, "loss": 1.5029, "step": 2136 }, { "epoch": 0.06, "learning_rate": 1.995788252189093e-05, "loss": 1.5107, "step": 2137 }, { "epoch": 0.06, "learning_rate": 1.9957801388740692e-05, "loss": 1.5215, "step": 2138 }, { "epoch": 0.06, "learning_rate": 1.9957720177685298e-05, "loss": 1.6128, "step": 2139 }, { "epoch": 0.06, "learning_rate": 1.9957638888725384e-05, "loss": 1.5703, "step": 2140 }, { "epoch": 0.06, "learning_rate": 1.9957557521861586e-05, "loss": 1.4255, "step": 2141 }, { "epoch": 0.06, "learning_rate": 1.995747607709454e-05, "loss": 1.7451, "step": 2142 }, { "epoch": 0.06, "learning_rate": 1.9957394554424884e-05, "loss": 1.5369, "step": 2143 }, { "epoch": 0.06, "learning_rate": 1.9957312953853254e-05, "loss": 1.7285, "step": 2144 }, { "epoch": 0.06, "learning_rate": 1.9957231275380292e-05, "loss": 1.5281, "step": 2145 }, { "epoch": 0.06, "learning_rate": 1.9957149519006634e-05, "loss": 1.3469, "step": 2146 }, { "epoch": 0.06, "learning_rate": 1.995706768473292e-05, "loss": 1.4041, "step": 2147 }, { "epoch": 0.06, "learning_rate": 1.9956985772559786e-05, "loss": 1.502, "step": 2148 }, { "epoch": 0.06, "learning_rate": 1.9956903782487885e-05, "loss": 1.3325, "step": 2149 }, { "epoch": 0.06, "learning_rate": 1.9956821714517847e-05, "loss": 1.5835, "step": 2150 }, { "epoch": 0.06, "learning_rate": 1.995673956865032e-05, "loss": 1.4609, "step": 2151 }, { "epoch": 0.06, "learning_rate": 1.995665734488594e-05, "loss": 1.46, "step": 2152 }, { "epoch": 0.06, "learning_rate": 1.9956575043225358e-05, "loss": 1.4946, "step": 2153 }, { "epoch": 0.06, "learning_rate": 1.9956492663669216e-05, "loss": 1.6089, "step": 2154 }, { "epoch": 0.06, "learning_rate": 1.9956410206218155e-05, "loss": 1.5835, "step": 2155 }, { "epoch": 0.06, "learning_rate": 1.9956327670872823e-05, "loss": 1.6201, "step": 2156 }, { "epoch": 0.06, "learning_rate": 1.9956245057633867e-05, "loss": 1.6929, "step": 2157 }, { "epoch": 0.06, "learning_rate": 1.995616236650193e-05, "loss": 1.6294, "step": 2158 }, { "epoch": 0.06, "learning_rate": 1.995607959747766e-05, "loss": 1.6084, "step": 2159 }, { "epoch": 0.06, "learning_rate": 1.9955996750561704e-05, "loss": 1.5249, "step": 2160 }, { "epoch": 0.06, "learning_rate": 1.9955913825754713e-05, "loss": 1.4651, "step": 2161 }, { "epoch": 0.06, "learning_rate": 1.9955830823057332e-05, "loss": 1.5454, "step": 2162 }, { "epoch": 0.06, "learning_rate": 1.9955747742470214e-05, "loss": 1.4399, "step": 2163 }, { "epoch": 0.06, "learning_rate": 1.995566458399401e-05, "loss": 1.4976, "step": 2164 }, { "epoch": 0.06, "learning_rate": 1.9955581347629363e-05, "loss": 1.4253, "step": 2165 }, { "epoch": 0.06, "learning_rate": 1.995549803337693e-05, "loss": 1.5054, "step": 2166 }, { "epoch": 0.06, "learning_rate": 1.9955414641237362e-05, "loss": 1.5552, "step": 2167 }, { "epoch": 0.06, "learning_rate": 1.9955331171211312e-05, "loss": 1.6582, "step": 2168 }, { "epoch": 0.06, "learning_rate": 1.995524762329943e-05, "loss": 1.6128, "step": 2169 }, { "epoch": 0.06, "learning_rate": 1.9955163997502374e-05, "loss": 1.4414, "step": 2170 }, { "epoch": 0.06, "learning_rate": 1.9955080293820798e-05, "loss": 1.6387, "step": 2171 }, { "epoch": 0.06, "learning_rate": 1.9954996512255352e-05, "loss": 1.7446, "step": 2172 }, { "epoch": 0.06, "learning_rate": 1.9954912652806694e-05, "loss": 1.5903, "step": 2173 }, { "epoch": 0.06, "learning_rate": 1.995482871547548e-05, "loss": 1.3916, "step": 2174 }, { "epoch": 0.06, "learning_rate": 1.995474470026237e-05, "loss": 1.6143, "step": 2175 }, { "epoch": 0.06, "learning_rate": 1.9954660607168014e-05, "loss": 1.4861, "step": 2176 }, { "epoch": 0.06, "learning_rate": 1.995457643619308e-05, "loss": 1.5847, "step": 2177 }, { "epoch": 0.06, "learning_rate": 1.9954492187338218e-05, "loss": 1.5435, "step": 2178 }, { "epoch": 0.06, "learning_rate": 1.995440786060409e-05, "loss": 1.6179, "step": 2179 }, { "epoch": 0.06, "learning_rate": 1.9954323455991357e-05, "loss": 1.5396, "step": 2180 }, { "epoch": 0.06, "learning_rate": 1.995423897350068e-05, "loss": 1.5088, "step": 2181 }, { "epoch": 0.06, "learning_rate": 1.9954154413132714e-05, "loss": 1.5264, "step": 2182 }, { "epoch": 0.06, "learning_rate": 1.9954069774888127e-05, "loss": 1.6377, "step": 2183 }, { "epoch": 0.06, "learning_rate": 1.9953985058767578e-05, "loss": 1.5566, "step": 2184 }, { "epoch": 0.06, "learning_rate": 1.995390026477173e-05, "loss": 1.5996, "step": 2185 }, { "epoch": 0.06, "learning_rate": 1.9953815392901247e-05, "loss": 1.6465, "step": 2186 }, { "epoch": 0.06, "learning_rate": 1.9953730443156793e-05, "loss": 1.6692, "step": 2187 }, { "epoch": 0.06, "learning_rate": 1.9953645415539037e-05, "loss": 1.4434, "step": 2188 }, { "epoch": 0.06, "learning_rate": 1.9953560310048633e-05, "loss": 1.5938, "step": 2189 }, { "epoch": 0.06, "learning_rate": 1.9953475126686255e-05, "loss": 1.4507, "step": 2190 }, { "epoch": 0.06, "learning_rate": 1.995338986545257e-05, "loss": 1.4873, "step": 2191 }, { "epoch": 0.06, "learning_rate": 1.9953304526348244e-05, "loss": 1.3772, "step": 2192 }, { "epoch": 0.06, "learning_rate": 1.9953219109373942e-05, "loss": 1.7979, "step": 2193 }, { "epoch": 0.06, "learning_rate": 1.9953133614530336e-05, "loss": 1.5493, "step": 2194 }, { "epoch": 0.06, "learning_rate": 1.9953048041818093e-05, "loss": 1.7051, "step": 2195 }, { "epoch": 0.06, "learning_rate": 1.9952962391237877e-05, "loss": 1.7051, "step": 2196 }, { "epoch": 0.06, "learning_rate": 1.9952876662790367e-05, "loss": 1.5391, "step": 2197 }, { "epoch": 0.06, "learning_rate": 1.9952790856476235e-05, "loss": 1.4536, "step": 2198 }, { "epoch": 0.06, "learning_rate": 1.995270497229614e-05, "loss": 1.5752, "step": 2199 }, { "epoch": 0.06, "learning_rate": 1.9952619010250767e-05, "loss": 1.4258, "step": 2200 }, { "epoch": 0.06, "learning_rate": 1.9952532970340778e-05, "loss": 1.5337, "step": 2201 }, { "epoch": 0.06, "learning_rate": 1.9952446852566852e-05, "loss": 1.5348, "step": 2202 }, { "epoch": 0.06, "learning_rate": 1.9952360656929666e-05, "loss": 1.4207, "step": 2203 }, { "epoch": 0.06, "learning_rate": 1.9952274383429885e-05, "loss": 1.4961, "step": 2204 }, { "epoch": 0.06, "learning_rate": 1.9952188032068195e-05, "loss": 1.4109, "step": 2205 }, { "epoch": 0.06, "learning_rate": 1.995210160284526e-05, "loss": 1.5098, "step": 2206 }, { "epoch": 0.06, "learning_rate": 1.9952015095761763e-05, "loss": 1.5488, "step": 2207 }, { "epoch": 0.06, "learning_rate": 1.9951928510818382e-05, "loss": 1.6143, "step": 2208 }, { "epoch": 0.06, "learning_rate": 1.995184184801579e-05, "loss": 1.4583, "step": 2209 }, { "epoch": 0.06, "learning_rate": 1.9951755107354668e-05, "loss": 1.5127, "step": 2210 }, { "epoch": 0.06, "learning_rate": 1.9951668288835694e-05, "loss": 1.3394, "step": 2211 }, { "epoch": 0.06, "learning_rate": 1.9951581392459545e-05, "loss": 1.4106, "step": 2212 }, { "epoch": 0.06, "learning_rate": 1.9951494418226906e-05, "loss": 1.5403, "step": 2213 }, { "epoch": 0.06, "learning_rate": 1.995140736613845e-05, "loss": 1.4688, "step": 2214 }, { "epoch": 0.06, "learning_rate": 1.9951320236194864e-05, "loss": 1.4729, "step": 2215 }, { "epoch": 0.06, "learning_rate": 1.9951233028396827e-05, "loss": 1.54, "step": 2216 }, { "epoch": 0.06, "learning_rate": 1.9951145742745027e-05, "loss": 1.5024, "step": 2217 }, { "epoch": 0.06, "learning_rate": 1.9951058379240138e-05, "loss": 1.5239, "step": 2218 }, { "epoch": 0.06, "learning_rate": 1.995097093788285e-05, "loss": 1.4683, "step": 2219 }, { "epoch": 0.06, "learning_rate": 1.995088341867384e-05, "loss": 1.696, "step": 2220 }, { "epoch": 0.06, "learning_rate": 1.9950795821613802e-05, "loss": 1.6406, "step": 2221 }, { "epoch": 0.06, "learning_rate": 1.9950708146703413e-05, "loss": 1.4297, "step": 2222 }, { "epoch": 0.06, "learning_rate": 1.9950620393943365e-05, "loss": 1.6704, "step": 2223 }, { "epoch": 0.06, "learning_rate": 1.995053256333434e-05, "loss": 1.4624, "step": 2224 }, { "epoch": 0.06, "learning_rate": 1.9950444654877033e-05, "loss": 1.4727, "step": 2225 }, { "epoch": 0.06, "learning_rate": 1.995035666857212e-05, "loss": 1.5142, "step": 2226 }, { "epoch": 0.06, "learning_rate": 1.99502686044203e-05, "loss": 1.5933, "step": 2227 }, { "epoch": 0.06, "learning_rate": 1.995018046242225e-05, "loss": 1.5486, "step": 2228 }, { "epoch": 0.06, "learning_rate": 1.9950092242578675e-05, "loss": 1.4365, "step": 2229 }, { "epoch": 0.06, "learning_rate": 1.9950003944890252e-05, "loss": 1.5332, "step": 2230 }, { "epoch": 0.06, "learning_rate": 1.994991556935768e-05, "loss": 1.5259, "step": 2231 }, { "epoch": 0.06, "learning_rate": 1.9949827115981647e-05, "loss": 1.5278, "step": 2232 }, { "epoch": 0.06, "learning_rate": 1.9949738584762843e-05, "loss": 1.7383, "step": 2233 }, { "epoch": 0.06, "learning_rate": 1.9949649975701965e-05, "loss": 1.5391, "step": 2234 }, { "epoch": 0.06, "learning_rate": 1.9949561288799705e-05, "loss": 1.4941, "step": 2235 }, { "epoch": 0.06, "learning_rate": 1.9949472524056753e-05, "loss": 1.707, "step": 2236 }, { "epoch": 0.06, "learning_rate": 1.994938368147381e-05, "loss": 1.4932, "step": 2237 }, { "epoch": 0.06, "learning_rate": 1.9949294761051567e-05, "loss": 1.5388, "step": 2238 }, { "epoch": 0.06, "learning_rate": 1.994920576279072e-05, "loss": 1.5474, "step": 2239 }, { "epoch": 0.06, "learning_rate": 1.9949116686691964e-05, "loss": 1.418, "step": 2240 }, { "epoch": 0.06, "learning_rate": 1.9949027532755998e-05, "loss": 1.5732, "step": 2241 }, { "epoch": 0.06, "learning_rate": 1.9948938300983517e-05, "loss": 1.5732, "step": 2242 }, { "epoch": 0.06, "learning_rate": 1.9948848991375228e-05, "loss": 1.3679, "step": 2243 }, { "epoch": 0.06, "learning_rate": 1.9948759603931814e-05, "loss": 1.6279, "step": 2244 }, { "epoch": 0.06, "learning_rate": 1.994867013865399e-05, "loss": 1.6545, "step": 2245 }, { "epoch": 0.06, "learning_rate": 1.9948580595542447e-05, "loss": 1.4185, "step": 2246 }, { "epoch": 0.06, "learning_rate": 1.9948490974597888e-05, "loss": 1.6013, "step": 2247 }, { "epoch": 0.06, "learning_rate": 1.994840127582101e-05, "loss": 1.3743, "step": 2248 }, { "epoch": 0.06, "learning_rate": 1.9948311499212522e-05, "loss": 1.6147, "step": 2249 }, { "epoch": 0.06, "learning_rate": 1.9948221644773122e-05, "loss": 1.5757, "step": 2250 }, { "epoch": 0.06, "learning_rate": 1.9948131712503513e-05, "loss": 1.5498, "step": 2251 }, { "epoch": 0.06, "learning_rate": 1.99480417024044e-05, "loss": 1.6265, "step": 2252 }, { "epoch": 0.06, "learning_rate": 1.9947951614476486e-05, "loss": 1.6128, "step": 2253 }, { "epoch": 0.06, "learning_rate": 1.9947861448720477e-05, "loss": 1.625, "step": 2254 }, { "epoch": 0.06, "learning_rate": 1.994777120513708e-05, "loss": 1.5308, "step": 2255 }, { "epoch": 0.06, "learning_rate": 1.9947680883726998e-05, "loss": 1.5684, "step": 2256 }, { "epoch": 0.06, "learning_rate": 1.9947590484490934e-05, "loss": 1.5176, "step": 2257 }, { "epoch": 0.06, "learning_rate": 1.9947500007429606e-05, "loss": 1.4233, "step": 2258 }, { "epoch": 0.06, "learning_rate": 1.9947409452543713e-05, "loss": 1.4619, "step": 2259 }, { "epoch": 0.06, "learning_rate": 1.9947318819833964e-05, "loss": 1.5032, "step": 2260 }, { "epoch": 0.06, "learning_rate": 1.994722810930107e-05, "loss": 1.584, "step": 2261 }, { "epoch": 0.06, "learning_rate": 1.9947137320945743e-05, "loss": 1.6309, "step": 2262 }, { "epoch": 0.06, "learning_rate": 1.9947046454768692e-05, "loss": 1.5161, "step": 2263 }, { "epoch": 0.06, "learning_rate": 1.9946955510770626e-05, "loss": 1.479, "step": 2264 }, { "epoch": 0.06, "learning_rate": 1.9946864488952258e-05, "loss": 1.543, "step": 2265 }, { "epoch": 0.06, "learning_rate": 1.99467733893143e-05, "loss": 1.6323, "step": 2266 }, { "epoch": 0.06, "learning_rate": 1.9946682211857462e-05, "loss": 1.6157, "step": 2267 }, { "epoch": 0.06, "learning_rate": 1.9946590956582462e-05, "loss": 1.5552, "step": 2268 }, { "epoch": 0.06, "learning_rate": 1.994649962349001e-05, "loss": 1.5752, "step": 2269 }, { "epoch": 0.06, "learning_rate": 1.9946408212580822e-05, "loss": 1.5481, "step": 2270 }, { "epoch": 0.06, "learning_rate": 1.9946316723855613e-05, "loss": 1.5635, "step": 2271 }, { "epoch": 0.06, "learning_rate": 1.99462251573151e-05, "loss": 1.5859, "step": 2272 }, { "epoch": 0.06, "learning_rate": 1.9946133512959997e-05, "loss": 1.543, "step": 2273 }, { "epoch": 0.06, "learning_rate": 1.9946041790791024e-05, "loss": 1.4858, "step": 2274 }, { "epoch": 0.06, "learning_rate": 1.9945949990808898e-05, "loss": 1.5132, "step": 2275 }, { "epoch": 0.06, "learning_rate": 1.9945858113014334e-05, "loss": 1.4478, "step": 2276 }, { "epoch": 0.06, "learning_rate": 1.9945766157408054e-05, "loss": 1.5664, "step": 2277 }, { "epoch": 0.06, "learning_rate": 1.9945674123990777e-05, "loss": 1.73, "step": 2278 }, { "epoch": 0.06, "learning_rate": 1.994558201276322e-05, "loss": 1.6753, "step": 2279 }, { "epoch": 0.06, "learning_rate": 1.994548982372611e-05, "loss": 1.5469, "step": 2280 }, { "epoch": 0.06, "learning_rate": 1.994539755688016e-05, "loss": 1.6743, "step": 2281 }, { "epoch": 0.06, "learning_rate": 1.9945305212226098e-05, "loss": 1.4924, "step": 2282 }, { "epoch": 0.06, "learning_rate": 1.9945212789764646e-05, "loss": 1.4824, "step": 2283 }, { "epoch": 0.06, "learning_rate": 1.9945120289496523e-05, "loss": 1.5947, "step": 2284 }, { "epoch": 0.06, "learning_rate": 1.9945027711422454e-05, "loss": 1.5117, "step": 2285 }, { "epoch": 0.06, "learning_rate": 1.994493505554317e-05, "loss": 1.2058, "step": 2286 }, { "epoch": 0.06, "learning_rate": 1.9944842321859392e-05, "loss": 1.3765, "step": 2287 }, { "epoch": 0.06, "learning_rate": 1.9944749510371838e-05, "loss": 1.8848, "step": 2288 }, { "epoch": 0.06, "learning_rate": 1.994465662108124e-05, "loss": 1.4912, "step": 2289 }, { "epoch": 0.06, "learning_rate": 1.9944563653988325e-05, "loss": 1.4856, "step": 2290 }, { "epoch": 0.06, "learning_rate": 1.9944470609093826e-05, "loss": 1.7695, "step": 2291 }, { "epoch": 0.06, "learning_rate": 1.9944377486398464e-05, "loss": 1.4146, "step": 2292 }, { "epoch": 0.06, "learning_rate": 1.9944284285902965e-05, "loss": 1.358, "step": 2293 }, { "epoch": 0.06, "learning_rate": 1.9944191007608063e-05, "loss": 1.5273, "step": 2294 }, { "epoch": 0.06, "learning_rate": 1.9944097651514486e-05, "loss": 1.5586, "step": 2295 }, { "epoch": 0.06, "learning_rate": 1.9944004217622966e-05, "loss": 1.4917, "step": 2296 }, { "epoch": 0.06, "learning_rate": 1.9943910705934234e-05, "loss": 1.5671, "step": 2297 }, { "epoch": 0.06, "learning_rate": 1.994381711644902e-05, "loss": 1.301, "step": 2298 }, { "epoch": 0.06, "learning_rate": 1.9943723449168053e-05, "loss": 1.5566, "step": 2299 }, { "epoch": 0.06, "learning_rate": 1.9943629704092074e-05, "loss": 1.7102, "step": 2300 }, { "epoch": 0.06, "learning_rate": 1.994353588122181e-05, "loss": 1.5229, "step": 2301 }, { "epoch": 0.06, "learning_rate": 1.9943441980558e-05, "loss": 1.4846, "step": 2302 }, { "epoch": 0.06, "learning_rate": 1.9943348002101374e-05, "loss": 1.4341, "step": 2303 }, { "epoch": 0.06, "learning_rate": 1.9943253945852667e-05, "loss": 1.6113, "step": 2304 }, { "epoch": 0.06, "learning_rate": 1.994315981181262e-05, "loss": 1.366, "step": 2305 }, { "epoch": 0.06, "learning_rate": 1.9943065599981964e-05, "loss": 1.3289, "step": 2306 }, { "epoch": 0.06, "learning_rate": 1.994297131036144e-05, "loss": 1.627, "step": 2307 }, { "epoch": 0.06, "learning_rate": 1.994287694295178e-05, "loss": 1.458, "step": 2308 }, { "epoch": 0.06, "learning_rate": 1.994278249775373e-05, "loss": 1.5264, "step": 2309 }, { "epoch": 0.06, "learning_rate": 1.9942687974768025e-05, "loss": 1.5264, "step": 2310 }, { "epoch": 0.06, "learning_rate": 1.9942593373995406e-05, "loss": 1.5571, "step": 2311 }, { "epoch": 0.06, "learning_rate": 1.9942498695436607e-05, "loss": 1.2451, "step": 2312 }, { "epoch": 0.06, "learning_rate": 1.9942403939092376e-05, "loss": 1.644, "step": 2313 }, { "epoch": 0.06, "learning_rate": 1.994230910496345e-05, "loss": 1.4834, "step": 2314 }, { "epoch": 0.06, "learning_rate": 1.9942214193050578e-05, "loss": 1.5999, "step": 2315 }, { "epoch": 0.06, "learning_rate": 1.9942119203354493e-05, "loss": 1.3767, "step": 2316 }, { "epoch": 0.06, "learning_rate": 1.9942024135875942e-05, "loss": 1.5376, "step": 2317 }, { "epoch": 0.06, "learning_rate": 1.9941928990615673e-05, "loss": 1.5244, "step": 2318 }, { "epoch": 0.06, "learning_rate": 1.9941833767574423e-05, "loss": 1.5381, "step": 2319 }, { "epoch": 0.06, "learning_rate": 1.9941738466752945e-05, "loss": 1.4697, "step": 2320 }, { "epoch": 0.06, "learning_rate": 1.9941643088151976e-05, "loss": 1.5286, "step": 2321 }, { "epoch": 0.06, "learning_rate": 1.9941547631772267e-05, "loss": 1.353, "step": 2322 }, { "epoch": 0.06, "learning_rate": 1.9941452097614565e-05, "loss": 1.52, "step": 2323 }, { "epoch": 0.06, "learning_rate": 1.9941356485679617e-05, "loss": 1.5173, "step": 2324 }, { "epoch": 0.06, "learning_rate": 1.994126079596817e-05, "loss": 1.4209, "step": 2325 }, { "epoch": 0.06, "learning_rate": 1.994116502848097e-05, "loss": 1.6558, "step": 2326 }, { "epoch": 0.06, "learning_rate": 1.9941069183218773e-05, "loss": 1.394, "step": 2327 }, { "epoch": 0.06, "learning_rate": 1.9940973260182325e-05, "loss": 1.4172, "step": 2328 }, { "epoch": 0.06, "learning_rate": 1.994087725937238e-05, "loss": 1.6763, "step": 2329 }, { "epoch": 0.06, "learning_rate": 1.994078118078968e-05, "loss": 1.7822, "step": 2330 }, { "epoch": 0.06, "learning_rate": 1.9940685024434986e-05, "loss": 1.5303, "step": 2331 }, { "epoch": 0.06, "learning_rate": 1.9940588790309045e-05, "loss": 1.502, "step": 2332 }, { "epoch": 0.06, "learning_rate": 1.9940492478412613e-05, "loss": 1.5469, "step": 2333 }, { "epoch": 0.06, "learning_rate": 1.9940396088746443e-05, "loss": 1.5425, "step": 2334 }, { "epoch": 0.06, "learning_rate": 1.9940299621311284e-05, "loss": 1.6689, "step": 2335 }, { "epoch": 0.06, "learning_rate": 1.99402030761079e-05, "loss": 1.3706, "step": 2336 }, { "epoch": 0.06, "learning_rate": 1.9940106453137042e-05, "loss": 1.5, "step": 2337 }, { "epoch": 0.06, "learning_rate": 1.9940009752399462e-05, "loss": 1.4653, "step": 2338 }, { "epoch": 0.06, "learning_rate": 1.993991297389592e-05, "loss": 1.4551, "step": 2339 }, { "epoch": 0.06, "learning_rate": 1.9939816117627173e-05, "loss": 1.4355, "step": 2340 }, { "epoch": 0.06, "learning_rate": 1.9939719183593978e-05, "loss": 1.5144, "step": 2341 }, { "epoch": 0.06, "learning_rate": 1.9939622171797098e-05, "loss": 1.3965, "step": 2342 }, { "epoch": 0.06, "learning_rate": 1.9939525082237283e-05, "loss": 1.501, "step": 2343 }, { "epoch": 0.06, "learning_rate": 1.99394279149153e-05, "loss": 1.5654, "step": 2344 }, { "epoch": 0.06, "learning_rate": 1.993933066983191e-05, "loss": 1.353, "step": 2345 }, { "epoch": 0.06, "learning_rate": 1.9939233346987864e-05, "loss": 1.4072, "step": 2346 }, { "epoch": 0.06, "learning_rate": 1.9939135946383935e-05, "loss": 1.5278, "step": 2347 }, { "epoch": 0.06, "learning_rate": 1.993903846802088e-05, "loss": 1.2887, "step": 2348 }, { "epoch": 0.06, "learning_rate": 1.993894091189946e-05, "loss": 1.5039, "step": 2349 }, { "epoch": 0.06, "learning_rate": 1.993884327802044e-05, "loss": 1.7217, "step": 2350 }, { "epoch": 0.06, "learning_rate": 1.9938745566384585e-05, "loss": 1.4795, "step": 2351 }, { "epoch": 0.06, "learning_rate": 1.9938647776992655e-05, "loss": 1.5645, "step": 2352 }, { "epoch": 0.06, "learning_rate": 1.993854990984542e-05, "loss": 1.521, "step": 2353 }, { "epoch": 0.06, "learning_rate": 1.9938451964943645e-05, "loss": 1.5825, "step": 2354 }, { "epoch": 0.06, "learning_rate": 1.9938353942288094e-05, "loss": 1.4734, "step": 2355 }, { "epoch": 0.06, "learning_rate": 1.993825584187954e-05, "loss": 1.7358, "step": 2356 }, { "epoch": 0.06, "learning_rate": 1.9938157663718738e-05, "loss": 1.614, "step": 2357 }, { "epoch": 0.06, "learning_rate": 1.9938059407806468e-05, "loss": 1.5715, "step": 2358 }, { "epoch": 0.06, "learning_rate": 1.9937961074143492e-05, "loss": 1.554, "step": 2359 }, { "epoch": 0.06, "learning_rate": 1.9937862662730586e-05, "loss": 1.5308, "step": 2360 }, { "epoch": 0.06, "learning_rate": 1.993776417356851e-05, "loss": 1.449, "step": 2361 }, { "epoch": 0.06, "learning_rate": 1.9937665606658046e-05, "loss": 1.5034, "step": 2362 }, { "epoch": 0.06, "learning_rate": 1.9937566961999954e-05, "loss": 1.3962, "step": 2363 }, { "epoch": 0.06, "learning_rate": 1.9937468239595015e-05, "loss": 1.5471, "step": 2364 }, { "epoch": 0.06, "learning_rate": 1.9937369439443995e-05, "loss": 1.459, "step": 2365 }, { "epoch": 0.06, "learning_rate": 1.993727056154767e-05, "loss": 1.3733, "step": 2366 }, { "epoch": 0.06, "learning_rate": 1.9937171605906815e-05, "loss": 1.439, "step": 2367 }, { "epoch": 0.06, "learning_rate": 1.99370725725222e-05, "loss": 1.5293, "step": 2368 }, { "epoch": 0.06, "learning_rate": 1.99369734613946e-05, "loss": 1.8501, "step": 2369 }, { "epoch": 0.06, "learning_rate": 1.9936874272524795e-05, "loss": 1.4551, "step": 2370 }, { "epoch": 0.06, "learning_rate": 1.993677500591356e-05, "loss": 1.5249, "step": 2371 }, { "epoch": 0.06, "learning_rate": 1.9936675661561666e-05, "loss": 1.4038, "step": 2372 }, { "epoch": 0.06, "learning_rate": 1.9936576239469895e-05, "loss": 1.6016, "step": 2373 }, { "epoch": 0.06, "learning_rate": 1.9936476739639028e-05, "loss": 1.5278, "step": 2374 }, { "epoch": 0.06, "learning_rate": 1.9936377162069836e-05, "loss": 1.4531, "step": 2375 }, { "epoch": 0.06, "learning_rate": 1.9936277506763103e-05, "loss": 1.5469, "step": 2376 }, { "epoch": 0.06, "learning_rate": 1.9936177773719604e-05, "loss": 1.3345, "step": 2377 }, { "epoch": 0.06, "learning_rate": 1.9936077962940127e-05, "loss": 1.4956, "step": 2378 }, { "epoch": 0.06, "learning_rate": 1.9935978074425444e-05, "loss": 1.52, "step": 2379 }, { "epoch": 0.06, "learning_rate": 1.9935878108176343e-05, "loss": 1.5503, "step": 2380 }, { "epoch": 0.07, "learning_rate": 1.99357780641936e-05, "loss": 1.4822, "step": 2381 }, { "epoch": 0.07, "learning_rate": 1.9935677942478005e-05, "loss": 1.9326, "step": 2382 }, { "epoch": 0.07, "learning_rate": 1.993557774303034e-05, "loss": 1.3926, "step": 2383 }, { "epoch": 0.07, "learning_rate": 1.9935477465851387e-05, "loss": 1.4756, "step": 2384 }, { "epoch": 0.07, "learning_rate": 1.9935377110941925e-05, "loss": 1.521, "step": 2385 }, { "epoch": 0.07, "learning_rate": 1.9935276678302747e-05, "loss": 1.4849, "step": 2386 }, { "epoch": 0.07, "learning_rate": 1.993517616793464e-05, "loss": 1.5989, "step": 2387 }, { "epoch": 0.07, "learning_rate": 1.9935075579838383e-05, "loss": 1.5762, "step": 2388 }, { "epoch": 0.07, "learning_rate": 1.9934974914014765e-05, "loss": 1.6143, "step": 2389 }, { "epoch": 0.07, "learning_rate": 1.9934874170464574e-05, "loss": 1.4167, "step": 2390 }, { "epoch": 0.07, "learning_rate": 1.9934773349188604e-05, "loss": 1.5308, "step": 2391 }, { "epoch": 0.07, "learning_rate": 1.9934672450187634e-05, "loss": 1.3762, "step": 2392 }, { "epoch": 0.07, "learning_rate": 1.9934571473462464e-05, "loss": 1.5859, "step": 2393 }, { "epoch": 0.07, "learning_rate": 1.9934470419013875e-05, "loss": 1.6167, "step": 2394 }, { "epoch": 0.07, "learning_rate": 1.993436928684266e-05, "loss": 1.5874, "step": 2395 }, { "epoch": 0.07, "learning_rate": 1.9934268076949615e-05, "loss": 1.4741, "step": 2396 }, { "epoch": 0.07, "learning_rate": 1.9934166789335526e-05, "loss": 1.5063, "step": 2397 }, { "epoch": 0.07, "learning_rate": 1.9934065424001187e-05, "loss": 1.6167, "step": 2398 }, { "epoch": 0.07, "learning_rate": 1.993396398094739e-05, "loss": 1.4963, "step": 2399 }, { "epoch": 0.07, "learning_rate": 1.9933862460174933e-05, "loss": 1.5737, "step": 2400 }, { "epoch": 0.07, "learning_rate": 1.9933760861684604e-05, "loss": 1.604, "step": 2401 }, { "epoch": 0.07, "learning_rate": 1.9933659185477203e-05, "loss": 1.3774, "step": 2402 }, { "epoch": 0.07, "learning_rate": 1.9933557431553523e-05, "loss": 1.5576, "step": 2403 }, { "epoch": 0.07, "learning_rate": 1.9933455599914363e-05, "loss": 1.5164, "step": 2404 }, { "epoch": 0.07, "learning_rate": 1.9933353690560516e-05, "loss": 1.436, "step": 2405 }, { "epoch": 0.07, "learning_rate": 1.993325170349278e-05, "loss": 1.6313, "step": 2406 }, { "epoch": 0.07, "learning_rate": 1.993314963871195e-05, "loss": 1.4368, "step": 2407 }, { "epoch": 0.07, "learning_rate": 1.9933047496218835e-05, "loss": 1.5093, "step": 2408 }, { "epoch": 0.07, "learning_rate": 1.9932945276014227e-05, "loss": 1.5378, "step": 2409 }, { "epoch": 0.07, "learning_rate": 1.9932842978098924e-05, "loss": 1.585, "step": 2410 }, { "epoch": 0.07, "learning_rate": 1.9932740602473725e-05, "loss": 1.5466, "step": 2411 }, { "epoch": 0.07, "learning_rate": 1.993263814913944e-05, "loss": 1.543, "step": 2412 }, { "epoch": 0.07, "learning_rate": 1.9932535618096864e-05, "loss": 1.8418, "step": 2413 }, { "epoch": 0.07, "learning_rate": 1.9932433009346794e-05, "loss": 1.5391, "step": 2414 }, { "epoch": 0.07, "learning_rate": 1.9932330322890045e-05, "loss": 1.4321, "step": 2415 }, { "epoch": 0.07, "learning_rate": 1.9932227558727407e-05, "loss": 1.488, "step": 2416 }, { "epoch": 0.07, "learning_rate": 1.9932124716859698e-05, "loss": 1.4409, "step": 2417 }, { "epoch": 0.07, "learning_rate": 1.9932021797287714e-05, "loss": 1.4407, "step": 2418 }, { "epoch": 0.07, "learning_rate": 1.993191880001226e-05, "loss": 1.5776, "step": 2419 }, { "epoch": 0.07, "learning_rate": 1.9931815725034144e-05, "loss": 1.321, "step": 2420 }, { "epoch": 0.07, "learning_rate": 1.9931712572354173e-05, "loss": 1.8335, "step": 2421 }, { "epoch": 0.07, "learning_rate": 1.9931609341973153e-05, "loss": 1.6416, "step": 2422 }, { "epoch": 0.07, "learning_rate": 1.9931506033891893e-05, "loss": 1.5459, "step": 2423 }, { "epoch": 0.07, "learning_rate": 1.99314026481112e-05, "loss": 1.5869, "step": 2424 }, { "epoch": 0.07, "learning_rate": 1.993129918463188e-05, "loss": 1.5942, "step": 2425 }, { "epoch": 0.07, "learning_rate": 1.9931195643454744e-05, "loss": 1.52, "step": 2426 }, { "epoch": 0.07, "learning_rate": 1.9931092024580606e-05, "loss": 1.469, "step": 2427 }, { "epoch": 0.07, "learning_rate": 1.9930988328010273e-05, "loss": 1.5229, "step": 2428 }, { "epoch": 0.07, "learning_rate": 1.993088455374456e-05, "loss": 1.4167, "step": 2429 }, { "epoch": 0.07, "learning_rate": 1.993078070178427e-05, "loss": 1.478, "step": 2430 }, { "epoch": 0.07, "learning_rate": 1.9930676772130227e-05, "loss": 1.5195, "step": 2431 }, { "epoch": 0.07, "learning_rate": 1.9930572764783238e-05, "loss": 1.4824, "step": 2432 }, { "epoch": 0.07, "learning_rate": 1.9930468679744114e-05, "loss": 1.5378, "step": 2433 }, { "epoch": 0.07, "learning_rate": 1.9930364517013678e-05, "loss": 1.5461, "step": 2434 }, { "epoch": 0.07, "learning_rate": 1.9930260276592736e-05, "loss": 1.5015, "step": 2435 }, { "epoch": 0.07, "learning_rate": 1.9930155958482108e-05, "loss": 1.4092, "step": 2436 }, { "epoch": 0.07, "learning_rate": 1.9930051562682608e-05, "loss": 1.6094, "step": 2437 }, { "epoch": 0.07, "learning_rate": 1.9929947089195055e-05, "loss": 1.4653, "step": 2438 }, { "epoch": 0.07, "learning_rate": 1.9929842538020266e-05, "loss": 1.4514, "step": 2439 }, { "epoch": 0.07, "learning_rate": 1.9929737909159058e-05, "loss": 1.4968, "step": 2440 }, { "epoch": 0.07, "learning_rate": 1.992963320261225e-05, "loss": 1.521, "step": 2441 }, { "epoch": 0.07, "learning_rate": 1.9929528418380658e-05, "loss": 1.521, "step": 2442 }, { "epoch": 0.07, "learning_rate": 1.9929423556465107e-05, "loss": 1.4624, "step": 2443 }, { "epoch": 0.07, "learning_rate": 1.9929318616866416e-05, "loss": 1.6118, "step": 2444 }, { "epoch": 0.07, "learning_rate": 1.992921359958541e-05, "loss": 1.4893, "step": 2445 }, { "epoch": 0.07, "learning_rate": 1.9929108504622898e-05, "loss": 1.4414, "step": 2446 }, { "epoch": 0.07, "learning_rate": 1.9929003331979713e-05, "loss": 1.5796, "step": 2447 }, { "epoch": 0.07, "learning_rate": 1.9928898081656672e-05, "loss": 1.5156, "step": 2448 }, { "epoch": 0.07, "learning_rate": 1.9928792753654608e-05, "loss": 1.4062, "step": 2449 }, { "epoch": 0.07, "learning_rate": 1.9928687347974334e-05, "loss": 1.4658, "step": 2450 }, { "epoch": 0.07, "learning_rate": 1.992858186461668e-05, "loss": 1.5327, "step": 2451 }, { "epoch": 0.07, "learning_rate": 1.9928476303582468e-05, "loss": 1.4822, "step": 2452 }, { "epoch": 0.07, "learning_rate": 1.992837066487253e-05, "loss": 1.5752, "step": 2453 }, { "epoch": 0.07, "learning_rate": 1.9928264948487682e-05, "loss": 1.4824, "step": 2454 }, { "epoch": 0.07, "learning_rate": 1.9928159154428765e-05, "loss": 1.3259, "step": 2455 }, { "epoch": 0.07, "learning_rate": 1.9928053282696597e-05, "loss": 1.6035, "step": 2456 }, { "epoch": 0.07, "learning_rate": 1.9927947333292006e-05, "loss": 1.623, "step": 2457 }, { "epoch": 0.07, "learning_rate": 1.9927841306215825e-05, "loss": 1.53, "step": 2458 }, { "epoch": 0.07, "learning_rate": 1.9927735201468882e-05, "loss": 1.4292, "step": 2459 }, { "epoch": 0.07, "learning_rate": 1.992762901905201e-05, "loss": 1.5269, "step": 2460 }, { "epoch": 0.07, "learning_rate": 1.9927522758966033e-05, "loss": 1.4326, "step": 2461 }, { "epoch": 0.07, "learning_rate": 1.9927416421211787e-05, "loss": 1.4844, "step": 2462 }, { "epoch": 0.07, "learning_rate": 1.9927310005790103e-05, "loss": 1.5452, "step": 2463 }, { "epoch": 0.07, "learning_rate": 1.9927203512701816e-05, "loss": 1.6353, "step": 2464 }, { "epoch": 0.07, "learning_rate": 1.9927096941947756e-05, "loss": 1.5259, "step": 2465 }, { "epoch": 0.07, "learning_rate": 1.9926990293528755e-05, "loss": 1.4473, "step": 2466 }, { "epoch": 0.07, "learning_rate": 1.9926883567445654e-05, "loss": 1.5327, "step": 2467 }, { "epoch": 0.07, "learning_rate": 1.992677676369928e-05, "loss": 1.3884, "step": 2468 }, { "epoch": 0.07, "learning_rate": 1.9926669882290476e-05, "loss": 1.3696, "step": 2469 }, { "epoch": 0.07, "learning_rate": 1.992656292322007e-05, "loss": 1.3369, "step": 2470 }, { "epoch": 0.07, "learning_rate": 1.9926455886488907e-05, "loss": 1.5454, "step": 2471 }, { "epoch": 0.07, "learning_rate": 1.992634877209782e-05, "loss": 1.5347, "step": 2472 }, { "epoch": 0.07, "learning_rate": 1.992624158004765e-05, "loss": 1.4966, "step": 2473 }, { "epoch": 0.07, "learning_rate": 1.992613431033923e-05, "loss": 1.4844, "step": 2474 }, { "epoch": 0.07, "learning_rate": 1.9926026962973407e-05, "loss": 1.4653, "step": 2475 }, { "epoch": 0.07, "learning_rate": 1.992591953795101e-05, "loss": 1.5386, "step": 2476 }, { "epoch": 0.07, "learning_rate": 1.9925812035272892e-05, "loss": 1.4299, "step": 2477 }, { "epoch": 0.07, "learning_rate": 1.9925704454939887e-05, "loss": 1.5449, "step": 2478 }, { "epoch": 0.07, "learning_rate": 1.9925596796952836e-05, "loss": 1.6204, "step": 2479 }, { "epoch": 0.07, "learning_rate": 1.9925489061312582e-05, "loss": 1.4546, "step": 2480 }, { "epoch": 0.07, "learning_rate": 1.9925381248019973e-05, "loss": 1.3821, "step": 2481 }, { "epoch": 0.07, "learning_rate": 1.9925273357075846e-05, "loss": 1.3589, "step": 2482 }, { "epoch": 0.07, "learning_rate": 1.9925165388481047e-05, "loss": 1.4104, "step": 2483 }, { "epoch": 0.07, "learning_rate": 1.992505734223642e-05, "loss": 1.6011, "step": 2484 }, { "epoch": 0.07, "learning_rate": 1.9924949218342814e-05, "loss": 1.8203, "step": 2485 }, { "epoch": 0.07, "learning_rate": 1.9924841016801073e-05, "loss": 1.5845, "step": 2486 }, { "epoch": 0.07, "learning_rate": 1.9924732737612042e-05, "loss": 1.5239, "step": 2487 }, { "epoch": 0.07, "learning_rate": 1.9924624380776568e-05, "loss": 1.4187, "step": 2488 }, { "epoch": 0.07, "learning_rate": 1.9924515946295498e-05, "loss": 1.5903, "step": 2489 }, { "epoch": 0.07, "learning_rate": 1.9924407434169686e-05, "loss": 1.5645, "step": 2490 }, { "epoch": 0.07, "learning_rate": 1.9924298844399975e-05, "loss": 1.5774, "step": 2491 }, { "epoch": 0.07, "learning_rate": 1.9924190176987217e-05, "loss": 1.6172, "step": 2492 }, { "epoch": 0.07, "learning_rate": 1.992408143193226e-05, "loss": 1.3853, "step": 2493 }, { "epoch": 0.07, "learning_rate": 1.9923972609235956e-05, "loss": 1.5989, "step": 2494 }, { "epoch": 0.07, "learning_rate": 1.992386370889916e-05, "loss": 1.5339, "step": 2495 }, { "epoch": 0.07, "learning_rate": 1.9923754730922723e-05, "loss": 1.427, "step": 2496 }, { "epoch": 0.07, "learning_rate": 1.992364567530749e-05, "loss": 1.5396, "step": 2497 }, { "epoch": 0.07, "learning_rate": 1.992353654205432e-05, "loss": 1.583, "step": 2498 }, { "epoch": 0.07, "learning_rate": 1.9923427331164072e-05, "loss": 1.7739, "step": 2499 }, { "epoch": 0.07, "learning_rate": 1.992331804263759e-05, "loss": 1.4915, "step": 2500 }, { "epoch": 0.07, "learning_rate": 1.9923208676475736e-05, "loss": 1.52, "step": 2501 }, { "epoch": 0.07, "learning_rate": 1.992309923267936e-05, "loss": 1.4678, "step": 2502 }, { "epoch": 0.07, "learning_rate": 1.9922989711249326e-05, "loss": 1.5518, "step": 2503 }, { "epoch": 0.07, "learning_rate": 1.9922880112186485e-05, "loss": 1.4348, "step": 2504 }, { "epoch": 0.07, "learning_rate": 1.99227704354917e-05, "loss": 1.604, "step": 2505 }, { "epoch": 0.07, "learning_rate": 1.9922660681165816e-05, "loss": 1.4558, "step": 2506 }, { "epoch": 0.07, "learning_rate": 1.992255084920971e-05, "loss": 1.5029, "step": 2507 }, { "epoch": 0.07, "learning_rate": 1.9922440939624226e-05, "loss": 1.4673, "step": 2508 }, { "epoch": 0.07, "learning_rate": 1.9922330952410235e-05, "loss": 1.4653, "step": 2509 }, { "epoch": 0.07, "learning_rate": 1.9922220887568585e-05, "loss": 1.5439, "step": 2510 }, { "epoch": 0.07, "learning_rate": 1.992211074510015e-05, "loss": 1.7407, "step": 2511 }, { "epoch": 0.07, "learning_rate": 1.9922000525005786e-05, "loss": 1.3999, "step": 2512 }, { "epoch": 0.07, "learning_rate": 1.9921890227286352e-05, "loss": 1.9185, "step": 2513 }, { "epoch": 0.07, "learning_rate": 1.9921779851942718e-05, "loss": 1.5581, "step": 2514 }, { "epoch": 0.07, "learning_rate": 1.9921669398975745e-05, "loss": 1.3713, "step": 2515 }, { "epoch": 0.07, "learning_rate": 1.9921558868386296e-05, "loss": 1.5422, "step": 2516 }, { "epoch": 0.07, "learning_rate": 1.9921448260175233e-05, "loss": 1.6301, "step": 2517 }, { "epoch": 0.07, "learning_rate": 1.9921337574343426e-05, "loss": 1.4265, "step": 2518 }, { "epoch": 0.07, "learning_rate": 1.9921226810891738e-05, "loss": 1.4385, "step": 2519 }, { "epoch": 0.07, "learning_rate": 1.9921115969821038e-05, "loss": 1.4402, "step": 2520 }, { "epoch": 0.07, "learning_rate": 1.9921005051132192e-05, "loss": 1.3552, "step": 2521 }, { "epoch": 0.07, "learning_rate": 1.9920894054826065e-05, "loss": 1.5991, "step": 2522 }, { "epoch": 0.07, "learning_rate": 1.992078298090353e-05, "loss": 1.4448, "step": 2523 }, { "epoch": 0.07, "learning_rate": 1.9920671829365454e-05, "loss": 1.6094, "step": 2524 }, { "epoch": 0.07, "learning_rate": 1.9920560600212707e-05, "loss": 1.5137, "step": 2525 }, { "epoch": 0.07, "learning_rate": 1.992044929344616e-05, "loss": 1.4241, "step": 2526 }, { "epoch": 0.07, "learning_rate": 1.992033790906668e-05, "loss": 1.437, "step": 2527 }, { "epoch": 0.07, "learning_rate": 1.992022644707514e-05, "loss": 1.6372, "step": 2528 }, { "epoch": 0.07, "learning_rate": 1.9920114907472415e-05, "loss": 1.4399, "step": 2529 }, { "epoch": 0.07, "learning_rate": 1.9920003290259377e-05, "loss": 1.5215, "step": 2530 }, { "epoch": 0.07, "learning_rate": 1.99198915954369e-05, "loss": 1.8115, "step": 2531 }, { "epoch": 0.07, "learning_rate": 1.991977982300585e-05, "loss": 1.8232, "step": 2532 }, { "epoch": 0.07, "learning_rate": 1.991966797296711e-05, "loss": 1.4761, "step": 2533 }, { "epoch": 0.07, "learning_rate": 1.9919556045321553e-05, "loss": 1.4875, "step": 2534 }, { "epoch": 0.07, "learning_rate": 1.9919444040070054e-05, "loss": 1.4697, "step": 2535 }, { "epoch": 0.07, "learning_rate": 1.9919331957213488e-05, "loss": 1.418, "step": 2536 }, { "epoch": 0.07, "learning_rate": 1.9919219796752732e-05, "loss": 1.519, "step": 2537 }, { "epoch": 0.07, "learning_rate": 1.9919107558688668e-05, "loss": 1.5132, "step": 2538 }, { "epoch": 0.07, "learning_rate": 1.991899524302217e-05, "loss": 1.502, "step": 2539 }, { "epoch": 0.07, "learning_rate": 1.9918882849754116e-05, "loss": 1.5042, "step": 2540 }, { "epoch": 0.07, "learning_rate": 1.9918770378885387e-05, "loss": 1.5066, "step": 2541 }, { "epoch": 0.07, "learning_rate": 1.9918657830416867e-05, "loss": 1.4204, "step": 2542 }, { "epoch": 0.07, "learning_rate": 1.9918545204349425e-05, "loss": 1.5654, "step": 2543 }, { "epoch": 0.07, "learning_rate": 1.9918432500683953e-05, "loss": 1.4348, "step": 2544 }, { "epoch": 0.07, "learning_rate": 1.991831971942133e-05, "loss": 1.4302, "step": 2545 }, { "epoch": 0.07, "learning_rate": 1.9918206860562433e-05, "loss": 1.6064, "step": 2546 }, { "epoch": 0.07, "learning_rate": 1.9918093924108154e-05, "loss": 1.6143, "step": 2547 }, { "epoch": 0.07, "learning_rate": 1.991798091005937e-05, "loss": 1.6343, "step": 2548 }, { "epoch": 0.07, "learning_rate": 1.991786781841697e-05, "loss": 1.6079, "step": 2549 }, { "epoch": 0.07, "learning_rate": 1.9917754649181835e-05, "loss": 1.5339, "step": 2550 }, { "epoch": 0.07, "learning_rate": 1.9917641402354846e-05, "loss": 1.2734, "step": 2551 }, { "epoch": 0.07, "learning_rate": 1.9917528077936898e-05, "loss": 1.7915, "step": 2552 }, { "epoch": 0.07, "learning_rate": 1.9917414675928875e-05, "loss": 1.3215, "step": 2553 }, { "epoch": 0.07, "learning_rate": 1.9917301196331662e-05, "loss": 1.4587, "step": 2554 }, { "epoch": 0.07, "learning_rate": 1.991718763914615e-05, "loss": 1.6372, "step": 2555 }, { "epoch": 0.07, "learning_rate": 1.9917074004373223e-05, "loss": 1.3865, "step": 2556 }, { "epoch": 0.07, "learning_rate": 1.991696029201377e-05, "loss": 1.3679, "step": 2557 }, { "epoch": 0.07, "learning_rate": 1.9916846502068688e-05, "loss": 1.4709, "step": 2558 }, { "epoch": 0.07, "learning_rate": 1.991673263453886e-05, "loss": 1.4607, "step": 2559 }, { "epoch": 0.07, "learning_rate": 1.991661868942518e-05, "loss": 1.502, "step": 2560 }, { "epoch": 0.07, "learning_rate": 1.9916504666728533e-05, "loss": 1.4553, "step": 2561 }, { "epoch": 0.07, "learning_rate": 1.9916390566449825e-05, "loss": 1.4971, "step": 2562 }, { "epoch": 0.07, "learning_rate": 1.9916276388589933e-05, "loss": 1.4075, "step": 2563 }, { "epoch": 0.07, "learning_rate": 1.991616213314976e-05, "loss": 1.6074, "step": 2564 }, { "epoch": 0.07, "learning_rate": 1.9916047800130198e-05, "loss": 1.4976, "step": 2565 }, { "epoch": 0.07, "learning_rate": 1.9915933389532143e-05, "loss": 1.4263, "step": 2566 }, { "epoch": 0.07, "learning_rate": 1.9915818901356486e-05, "loss": 1.4624, "step": 2567 }, { "epoch": 0.07, "learning_rate": 1.9915704335604124e-05, "loss": 1.4775, "step": 2568 }, { "epoch": 0.07, "learning_rate": 1.9915589692275955e-05, "loss": 1.4409, "step": 2569 }, { "epoch": 0.07, "learning_rate": 1.9915474971372872e-05, "loss": 1.5732, "step": 2570 }, { "epoch": 0.07, "learning_rate": 1.991536017289578e-05, "loss": 1.5479, "step": 2571 }, { "epoch": 0.07, "learning_rate": 1.9915245296845568e-05, "loss": 1.5986, "step": 2572 }, { "epoch": 0.07, "learning_rate": 1.9915130343223145e-05, "loss": 1.5439, "step": 2573 }, { "epoch": 0.07, "learning_rate": 1.99150153120294e-05, "loss": 1.4648, "step": 2574 }, { "epoch": 0.07, "learning_rate": 1.991490020326524e-05, "loss": 1.5205, "step": 2575 }, { "epoch": 0.07, "learning_rate": 1.991478501693156e-05, "loss": 1.4092, "step": 2576 }, { "epoch": 0.07, "learning_rate": 1.9914669753029264e-05, "loss": 1.6099, "step": 2577 }, { "epoch": 0.07, "learning_rate": 1.9914554411559257e-05, "loss": 1.564, "step": 2578 }, { "epoch": 0.07, "learning_rate": 1.9914438992522437e-05, "loss": 1.5503, "step": 2579 }, { "epoch": 0.07, "learning_rate": 1.991432349591971e-05, "loss": 1.3501, "step": 2580 }, { "epoch": 0.07, "learning_rate": 1.991420792175198e-05, "loss": 1.5508, "step": 2581 }, { "epoch": 0.07, "learning_rate": 1.9914092270020142e-05, "loss": 1.6714, "step": 2582 }, { "epoch": 0.07, "learning_rate": 1.9913976540725116e-05, "loss": 1.6211, "step": 2583 }, { "epoch": 0.07, "learning_rate": 1.9913860733867794e-05, "loss": 1.5894, "step": 2584 }, { "epoch": 0.07, "learning_rate": 1.9913744849449088e-05, "loss": 1.4666, "step": 2585 }, { "epoch": 0.07, "learning_rate": 1.9913628887469906e-05, "loss": 1.3928, "step": 2586 }, { "epoch": 0.07, "learning_rate": 1.9913512847931152e-05, "loss": 1.5044, "step": 2587 }, { "epoch": 0.07, "learning_rate": 1.9913396730833736e-05, "loss": 1.4141, "step": 2588 }, { "epoch": 0.07, "learning_rate": 1.9913280536178564e-05, "loss": 1.2554, "step": 2589 }, { "epoch": 0.07, "learning_rate": 1.9913164263966548e-05, "loss": 1.5537, "step": 2590 }, { "epoch": 0.07, "learning_rate": 1.9913047914198597e-05, "loss": 1.5571, "step": 2591 }, { "epoch": 0.07, "learning_rate": 1.991293148687562e-05, "loss": 1.5264, "step": 2592 }, { "epoch": 0.07, "learning_rate": 1.991281498199853e-05, "loss": 1.5728, "step": 2593 }, { "epoch": 0.07, "learning_rate": 1.9912698399568234e-05, "loss": 1.5552, "step": 2594 }, { "epoch": 0.07, "learning_rate": 1.9912581739585647e-05, "loss": 1.6143, "step": 2595 }, { "epoch": 0.07, "learning_rate": 1.9912465002051684e-05, "loss": 1.5659, "step": 2596 }, { "epoch": 0.07, "learning_rate": 1.9912348186967253e-05, "loss": 1.3694, "step": 2597 }, { "epoch": 0.07, "learning_rate": 1.9912231294333274e-05, "loss": 1.4631, "step": 2598 }, { "epoch": 0.07, "learning_rate": 1.9912114324150656e-05, "loss": 1.522, "step": 2599 }, { "epoch": 0.07, "learning_rate": 1.991199727642032e-05, "loss": 1.4185, "step": 2600 }, { "epoch": 0.07, "learning_rate": 1.9911880151143174e-05, "loss": 1.4224, "step": 2601 }, { "epoch": 0.07, "learning_rate": 1.9911762948320138e-05, "loss": 1.519, "step": 2602 }, { "epoch": 0.07, "learning_rate": 1.9911645667952134e-05, "loss": 1.5815, "step": 2603 }, { "epoch": 0.07, "learning_rate": 1.9911528310040073e-05, "loss": 1.6187, "step": 2604 }, { "epoch": 0.07, "learning_rate": 1.9911410874584877e-05, "loss": 1.5581, "step": 2605 }, { "epoch": 0.07, "learning_rate": 1.9911293361587457e-05, "loss": 1.6011, "step": 2606 }, { "epoch": 0.07, "learning_rate": 1.9911175771048744e-05, "loss": 1.4868, "step": 2607 }, { "epoch": 0.07, "learning_rate": 1.9911058102969653e-05, "loss": 1.4209, "step": 2608 }, { "epoch": 0.07, "learning_rate": 1.99109403573511e-05, "loss": 1.5, "step": 2609 }, { "epoch": 0.07, "learning_rate": 1.9910822534194013e-05, "loss": 1.6704, "step": 2610 }, { "epoch": 0.07, "learning_rate": 1.9910704633499312e-05, "loss": 1.5078, "step": 2611 }, { "epoch": 0.07, "learning_rate": 1.9910586655267914e-05, "loss": 1.5913, "step": 2612 }, { "epoch": 0.07, "learning_rate": 1.9910468599500746e-05, "loss": 1.5674, "step": 2613 }, { "epoch": 0.07, "learning_rate": 1.9910350466198736e-05, "loss": 1.6318, "step": 2614 }, { "epoch": 0.07, "learning_rate": 1.9910232255362804e-05, "loss": 1.5933, "step": 2615 }, { "epoch": 0.07, "learning_rate": 1.9910113966993873e-05, "loss": 1.4233, "step": 2616 }, { "epoch": 0.07, "learning_rate": 1.990999560109287e-05, "loss": 1.533, "step": 2617 }, { "epoch": 0.07, "learning_rate": 1.9909877157660724e-05, "loss": 1.5996, "step": 2618 }, { "epoch": 0.07, "learning_rate": 1.9909758636698355e-05, "loss": 1.8438, "step": 2619 }, { "epoch": 0.07, "learning_rate": 1.9909640038206698e-05, "loss": 1.5562, "step": 2620 }, { "epoch": 0.07, "learning_rate": 1.9909521362186677e-05, "loss": 1.425, "step": 2621 }, { "epoch": 0.07, "learning_rate": 1.990940260863922e-05, "loss": 1.4766, "step": 2622 }, { "epoch": 0.07, "learning_rate": 1.9909283777565257e-05, "loss": 1.5444, "step": 2623 }, { "epoch": 0.07, "learning_rate": 1.9909164868965714e-05, "loss": 1.5825, "step": 2624 }, { "epoch": 0.07, "learning_rate": 1.9909045882841528e-05, "loss": 1.6621, "step": 2625 }, { "epoch": 0.07, "learning_rate": 1.9908926819193627e-05, "loss": 1.4309, "step": 2626 }, { "epoch": 0.07, "learning_rate": 1.990880767802294e-05, "loss": 1.6018, "step": 2627 }, { "epoch": 0.07, "learning_rate": 1.99086884593304e-05, "loss": 1.5713, "step": 2628 }, { "epoch": 0.07, "learning_rate": 1.9908569163116943e-05, "loss": 1.5083, "step": 2629 }, { "epoch": 0.07, "learning_rate": 1.99084497893835e-05, "loss": 1.5137, "step": 2630 }, { "epoch": 0.07, "learning_rate": 1.9908330338131008e-05, "loss": 1.4497, "step": 2631 }, { "epoch": 0.07, "learning_rate": 1.9908210809360392e-05, "loss": 1.4761, "step": 2632 }, { "epoch": 0.07, "learning_rate": 1.99080912030726e-05, "loss": 1.8726, "step": 2633 }, { "epoch": 0.07, "learning_rate": 1.9907971519268558e-05, "loss": 1.6074, "step": 2634 }, { "epoch": 0.07, "learning_rate": 1.9907851757949207e-05, "loss": 1.5532, "step": 2635 }, { "epoch": 0.07, "learning_rate": 1.9907731919115486e-05, "loss": 1.5151, "step": 2636 }, { "epoch": 0.07, "learning_rate": 1.9907612002768326e-05, "loss": 1.459, "step": 2637 }, { "epoch": 0.07, "learning_rate": 1.990749200890867e-05, "loss": 1.3215, "step": 2638 }, { "epoch": 0.07, "learning_rate": 1.990737193753745e-05, "loss": 1.3369, "step": 2639 }, { "epoch": 0.07, "learning_rate": 1.9907251788655617e-05, "loss": 1.541, "step": 2640 }, { "epoch": 0.07, "learning_rate": 1.9907131562264102e-05, "loss": 1.4055, "step": 2641 }, { "epoch": 0.07, "learning_rate": 1.990701125836385e-05, "loss": 1.3696, "step": 2642 }, { "epoch": 0.07, "learning_rate": 1.99068908769558e-05, "loss": 1.5322, "step": 2643 }, { "epoch": 0.07, "learning_rate": 1.9906770418040895e-05, "loss": 1.5413, "step": 2644 }, { "epoch": 0.07, "learning_rate": 1.9906649881620075e-05, "loss": 1.6177, "step": 2645 }, { "epoch": 0.07, "learning_rate": 1.9906529267694283e-05, "loss": 1.4985, "step": 2646 }, { "epoch": 0.07, "learning_rate": 1.9906408576264468e-05, "loss": 1.5498, "step": 2647 }, { "epoch": 0.07, "learning_rate": 1.9906287807331572e-05, "loss": 1.8179, "step": 2648 }, { "epoch": 0.07, "learning_rate": 1.9906166960896533e-05, "loss": 1.6636, "step": 2649 }, { "epoch": 0.07, "learning_rate": 1.9906046036960304e-05, "loss": 1.449, "step": 2650 }, { "epoch": 0.07, "learning_rate": 1.9905925035523834e-05, "loss": 1.4792, "step": 2651 }, { "epoch": 0.07, "learning_rate": 1.990580395658806e-05, "loss": 1.5513, "step": 2652 }, { "epoch": 0.07, "learning_rate": 1.9905682800153935e-05, "loss": 1.582, "step": 2653 }, { "epoch": 0.07, "learning_rate": 1.99055615662224e-05, "loss": 1.5435, "step": 2654 }, { "epoch": 0.07, "learning_rate": 1.9905440254794416e-05, "loss": 1.4932, "step": 2655 }, { "epoch": 0.07, "learning_rate": 1.9905318865870926e-05, "loss": 1.4983, "step": 2656 }, { "epoch": 0.07, "learning_rate": 1.9905197399452873e-05, "loss": 1.5825, "step": 2657 }, { "epoch": 0.07, "learning_rate": 1.990507585554122e-05, "loss": 1.5405, "step": 2658 }, { "epoch": 0.07, "learning_rate": 1.9904954234136906e-05, "loss": 1.7041, "step": 2659 }, { "epoch": 0.07, "learning_rate": 1.9904832535240892e-05, "loss": 1.3186, "step": 2660 }, { "epoch": 0.07, "learning_rate": 1.990471075885412e-05, "loss": 1.522, "step": 2661 }, { "epoch": 0.07, "learning_rate": 1.9904588904977556e-05, "loss": 1.408, "step": 2662 }, { "epoch": 0.07, "learning_rate": 1.990446697361214e-05, "loss": 1.627, "step": 2663 }, { "epoch": 0.07, "learning_rate": 1.9904344964758833e-05, "loss": 1.4473, "step": 2664 }, { "epoch": 0.07, "learning_rate": 1.990422287841859e-05, "loss": 1.4658, "step": 2665 }, { "epoch": 0.07, "learning_rate": 1.9904100714592364e-05, "loss": 1.502, "step": 2666 }, { "epoch": 0.07, "learning_rate": 1.990397847328111e-05, "loss": 1.3765, "step": 2667 }, { "epoch": 0.07, "learning_rate": 1.9903856154485786e-05, "loss": 1.5576, "step": 2668 }, { "epoch": 0.07, "learning_rate": 1.990373375820735e-05, "loss": 1.5898, "step": 2669 }, { "epoch": 0.07, "learning_rate": 1.990361128444676e-05, "loss": 1.5635, "step": 2670 }, { "epoch": 0.07, "learning_rate": 1.9903488733204967e-05, "loss": 1.8745, "step": 2671 }, { "epoch": 0.07, "learning_rate": 1.990336610448294e-05, "loss": 1.3989, "step": 2672 }, { "epoch": 0.07, "learning_rate": 1.9903243398281628e-05, "loss": 1.5859, "step": 2673 }, { "epoch": 0.07, "learning_rate": 1.9903120614602e-05, "loss": 1.5884, "step": 2674 }, { "epoch": 0.07, "learning_rate": 1.9902997753445016e-05, "loss": 1.4783, "step": 2675 }, { "epoch": 0.07, "learning_rate": 1.990287481481163e-05, "loss": 1.5469, "step": 2676 }, { "epoch": 0.07, "learning_rate": 1.9902751798702807e-05, "loss": 1.5063, "step": 2677 }, { "epoch": 0.07, "learning_rate": 1.9902628705119514e-05, "loss": 1.6138, "step": 2678 }, { "epoch": 0.07, "learning_rate": 1.9902505534062708e-05, "loss": 1.3633, "step": 2679 }, { "epoch": 0.07, "learning_rate": 1.9902382285533358e-05, "loss": 1.5093, "step": 2680 }, { "epoch": 0.07, "learning_rate": 1.9902258959532424e-05, "loss": 1.5898, "step": 2681 }, { "epoch": 0.07, "learning_rate": 1.990213555606087e-05, "loss": 1.5601, "step": 2682 }, { "epoch": 0.07, "learning_rate": 1.990201207511967e-05, "loss": 1.4114, "step": 2683 }, { "epoch": 0.07, "learning_rate": 1.9901888516709777e-05, "loss": 1.405, "step": 2684 }, { "epoch": 0.07, "learning_rate": 1.9901764880832165e-05, "loss": 1.4927, "step": 2685 }, { "epoch": 0.07, "learning_rate": 1.9901641167487804e-05, "loss": 1.3831, "step": 2686 }, { "epoch": 0.07, "learning_rate": 1.9901517376677658e-05, "loss": 1.3936, "step": 2687 }, { "epoch": 0.07, "learning_rate": 1.9901393508402697e-05, "loss": 1.4219, "step": 2688 }, { "epoch": 0.07, "learning_rate": 1.9901269562663886e-05, "loss": 1.4292, "step": 2689 }, { "epoch": 0.07, "learning_rate": 1.99011455394622e-05, "loss": 1.5127, "step": 2690 }, { "epoch": 0.07, "learning_rate": 1.9901021438798604e-05, "loss": 1.6357, "step": 2691 }, { "epoch": 0.07, "learning_rate": 1.9900897260674074e-05, "loss": 1.5361, "step": 2692 }, { "epoch": 0.07, "learning_rate": 1.990077300508958e-05, "loss": 1.4629, "step": 2693 }, { "epoch": 0.07, "learning_rate": 1.9900648672046096e-05, "loss": 1.3936, "step": 2694 }, { "epoch": 0.07, "learning_rate": 1.990052426154459e-05, "loss": 1.5457, "step": 2695 }, { "epoch": 0.07, "learning_rate": 1.990039977358604e-05, "loss": 1.5024, "step": 2696 }, { "epoch": 0.07, "learning_rate": 1.9900275208171413e-05, "loss": 1.4241, "step": 2697 }, { "epoch": 0.07, "learning_rate": 1.990015056530169e-05, "loss": 1.4922, "step": 2698 }, { "epoch": 0.07, "learning_rate": 1.9900025844977846e-05, "loss": 1.5493, "step": 2699 }, { "epoch": 0.07, "learning_rate": 1.9899901047200855e-05, "loss": 1.3645, "step": 2700 }, { "epoch": 0.07, "learning_rate": 1.9899776171971693e-05, "loss": 1.5249, "step": 2701 }, { "epoch": 0.07, "learning_rate": 1.989965121929134e-05, "loss": 1.4316, "step": 2702 }, { "epoch": 0.07, "learning_rate": 1.9899526189160766e-05, "loss": 1.509, "step": 2703 }, { "epoch": 0.07, "learning_rate": 1.9899401081580956e-05, "loss": 1.457, "step": 2704 }, { "epoch": 0.07, "learning_rate": 1.9899275896552888e-05, "loss": 1.4072, "step": 2705 }, { "epoch": 0.07, "learning_rate": 1.989915063407754e-05, "loss": 1.4673, "step": 2706 }, { "epoch": 0.07, "learning_rate": 1.9899025294155893e-05, "loss": 1.48, "step": 2707 }, { "epoch": 0.07, "learning_rate": 1.9898899876788924e-05, "loss": 1.4705, "step": 2708 }, { "epoch": 0.07, "learning_rate": 1.9898774381977618e-05, "loss": 1.4761, "step": 2709 }, { "epoch": 0.07, "learning_rate": 1.989864880972296e-05, "loss": 1.4541, "step": 2710 }, { "epoch": 0.07, "learning_rate": 1.9898523160025922e-05, "loss": 1.5132, "step": 2711 }, { "epoch": 0.07, "learning_rate": 1.9898397432887498e-05, "loss": 1.5063, "step": 2712 }, { "epoch": 0.07, "learning_rate": 1.9898271628308667e-05, "loss": 1.3489, "step": 2713 }, { "epoch": 0.07, "learning_rate": 1.989814574629041e-05, "loss": 1.6992, "step": 2714 }, { "epoch": 0.07, "learning_rate": 1.9898019786833716e-05, "loss": 1.4373, "step": 2715 }, { "epoch": 0.07, "learning_rate": 1.9897893749939575e-05, "loss": 1.6421, "step": 2716 }, { "epoch": 0.07, "learning_rate": 1.989776763560896e-05, "loss": 1.46, "step": 2717 }, { "epoch": 0.07, "learning_rate": 1.989764144384287e-05, "loss": 1.6074, "step": 2718 }, { "epoch": 0.07, "learning_rate": 1.9897515174642288e-05, "loss": 1.3569, "step": 2719 }, { "epoch": 0.07, "learning_rate": 1.98973888280082e-05, "loss": 1.5137, "step": 2720 }, { "epoch": 0.07, "learning_rate": 1.9897262403941596e-05, "loss": 1.4136, "step": 2721 }, { "epoch": 0.07, "learning_rate": 1.9897135902443463e-05, "loss": 1.3748, "step": 2722 }, { "epoch": 0.07, "learning_rate": 1.9897009323514792e-05, "loss": 1.4045, "step": 2723 }, { "epoch": 0.07, "learning_rate": 1.989688266715658e-05, "loss": 1.614, "step": 2724 }, { "epoch": 0.07, "learning_rate": 1.9896755933369805e-05, "loss": 1.4595, "step": 2725 }, { "epoch": 0.07, "learning_rate": 1.989662912215547e-05, "loss": 1.5249, "step": 2726 }, { "epoch": 0.07, "learning_rate": 1.989650223351456e-05, "loss": 1.3809, "step": 2727 }, { "epoch": 0.07, "learning_rate": 1.989637526744807e-05, "loss": 1.4487, "step": 2728 }, { "epoch": 0.07, "learning_rate": 1.9896248223956998e-05, "loss": 1.583, "step": 2729 }, { "epoch": 0.07, "learning_rate": 1.989612110304233e-05, "loss": 1.5278, "step": 2730 }, { "epoch": 0.07, "learning_rate": 1.9895993904705064e-05, "loss": 1.5315, "step": 2731 }, { "epoch": 0.07, "learning_rate": 1.9895866628946196e-05, "loss": 1.52, "step": 2732 }, { "epoch": 0.07, "learning_rate": 1.9895739275766717e-05, "loss": 1.5029, "step": 2733 }, { "epoch": 0.07, "learning_rate": 1.989561184516763e-05, "loss": 1.4102, "step": 2734 }, { "epoch": 0.07, "learning_rate": 1.989548433714993e-05, "loss": 1.4458, "step": 2735 }, { "epoch": 0.07, "learning_rate": 1.9895356751714614e-05, "loss": 1.4209, "step": 2736 }, { "epoch": 0.07, "learning_rate": 1.989522908886268e-05, "loss": 1.4697, "step": 2737 }, { "epoch": 0.07, "learning_rate": 1.9895101348595123e-05, "loss": 1.418, "step": 2738 }, { "epoch": 0.07, "learning_rate": 1.989497353091295e-05, "loss": 1.5967, "step": 2739 }, { "epoch": 0.07, "learning_rate": 1.9894845635817158e-05, "loss": 1.4104, "step": 2740 }, { "epoch": 0.07, "learning_rate": 1.9894717663308744e-05, "loss": 1.4902, "step": 2741 }, { "epoch": 0.07, "learning_rate": 1.989458961338871e-05, "loss": 1.4329, "step": 2742 }, { "epoch": 0.07, "learning_rate": 1.989446148605806e-05, "loss": 1.3157, "step": 2743 }, { "epoch": 0.07, "learning_rate": 1.9894333281317803e-05, "loss": 1.4539, "step": 2744 }, { "epoch": 0.07, "learning_rate": 1.9894204999168926e-05, "loss": 1.4382, "step": 2745 }, { "epoch": 0.07, "learning_rate": 1.989407663961245e-05, "loss": 1.4651, "step": 2746 }, { "epoch": 0.08, "learning_rate": 1.9893948202649364e-05, "loss": 1.4763, "step": 2747 }, { "epoch": 0.08, "learning_rate": 1.989381968828068e-05, "loss": 1.5518, "step": 2748 }, { "epoch": 0.08, "learning_rate": 1.9893691096507405e-05, "loss": 1.3892, "step": 2749 }, { "epoch": 0.08, "learning_rate": 1.9893562427330546e-05, "loss": 1.5327, "step": 2750 }, { "epoch": 0.08, "learning_rate": 1.9893433680751105e-05, "loss": 1.4197, "step": 2751 }, { "epoch": 0.08, "learning_rate": 1.9893304856770088e-05, "loss": 1.4565, "step": 2752 }, { "epoch": 0.08, "learning_rate": 1.989317595538851e-05, "loss": 1.563, "step": 2753 }, { "epoch": 0.08, "learning_rate": 1.9893046976607372e-05, "loss": 1.605, "step": 2754 }, { "epoch": 0.08, "learning_rate": 1.989291792042769e-05, "loss": 1.6704, "step": 2755 }, { "epoch": 0.08, "learning_rate": 1.9892788786850468e-05, "loss": 1.4294, "step": 2756 }, { "epoch": 0.08, "learning_rate": 1.989265957587672e-05, "loss": 1.502, "step": 2757 }, { "epoch": 0.08, "learning_rate": 1.9892530287507453e-05, "loss": 1.5195, "step": 2758 }, { "epoch": 0.08, "learning_rate": 1.9892400921743685e-05, "loss": 1.5659, "step": 2759 }, { "epoch": 0.08, "learning_rate": 1.989227147858642e-05, "loss": 1.4124, "step": 2760 }, { "epoch": 0.08, "learning_rate": 1.9892141958036674e-05, "loss": 1.5659, "step": 2761 }, { "epoch": 0.08, "learning_rate": 1.9892012360095463e-05, "loss": 1.4722, "step": 2762 }, { "epoch": 0.08, "learning_rate": 1.98918826847638e-05, "loss": 1.4961, "step": 2763 }, { "epoch": 0.08, "learning_rate": 1.9891752932042695e-05, "loss": 1.5308, "step": 2764 }, { "epoch": 0.08, "learning_rate": 1.989162310193317e-05, "loss": 1.5, "step": 2765 }, { "epoch": 0.08, "learning_rate": 1.9891493194436235e-05, "loss": 1.5232, "step": 2766 }, { "epoch": 0.08, "learning_rate": 1.9891363209552908e-05, "loss": 1.4626, "step": 2767 }, { "epoch": 0.08, "learning_rate": 1.9891233147284207e-05, "loss": 1.4985, "step": 2768 }, { "epoch": 0.08, "learning_rate": 1.9891103007631152e-05, "loss": 1.532, "step": 2769 }, { "epoch": 0.08, "learning_rate": 1.9890972790594752e-05, "loss": 1.5518, "step": 2770 }, { "epoch": 0.08, "learning_rate": 1.9890842496176038e-05, "loss": 1.5942, "step": 2771 }, { "epoch": 0.08, "learning_rate": 1.9890712124376023e-05, "loss": 1.5056, "step": 2772 }, { "epoch": 0.08, "learning_rate": 1.9890581675195723e-05, "loss": 1.9102, "step": 2773 }, { "epoch": 0.08, "learning_rate": 1.9890451148636164e-05, "loss": 1.728, "step": 2774 }, { "epoch": 0.08, "learning_rate": 1.989032054469837e-05, "loss": 1.5195, "step": 2775 }, { "epoch": 0.08, "learning_rate": 1.9890189863383354e-05, "loss": 1.5073, "step": 2776 }, { "epoch": 0.08, "learning_rate": 1.9890059104692146e-05, "loss": 1.5278, "step": 2777 }, { "epoch": 0.08, "learning_rate": 1.9889928268625766e-05, "loss": 1.3894, "step": 2778 }, { "epoch": 0.08, "learning_rate": 1.9889797355185237e-05, "loss": 1.5859, "step": 2779 }, { "epoch": 0.08, "learning_rate": 1.9889666364371586e-05, "loss": 1.3831, "step": 2780 }, { "epoch": 0.08, "learning_rate": 1.9889535296185835e-05, "loss": 1.7009, "step": 2781 }, { "epoch": 0.08, "learning_rate": 1.9889404150629005e-05, "loss": 1.5386, "step": 2782 }, { "epoch": 0.08, "learning_rate": 1.9889272927702135e-05, "loss": 1.8706, "step": 2783 }, { "epoch": 0.08, "learning_rate": 1.988914162740624e-05, "loss": 1.4961, "step": 2784 }, { "epoch": 0.08, "learning_rate": 1.988901024974235e-05, "loss": 1.4648, "step": 2785 }, { "epoch": 0.08, "learning_rate": 1.9888878794711497e-05, "loss": 1.6758, "step": 2786 }, { "epoch": 0.08, "learning_rate": 1.9888747262314703e-05, "loss": 1.5117, "step": 2787 }, { "epoch": 0.08, "learning_rate": 1.9888615652553006e-05, "loss": 1.4924, "step": 2788 }, { "epoch": 0.08, "learning_rate": 1.9888483965427423e-05, "loss": 1.5583, "step": 2789 }, { "epoch": 0.08, "learning_rate": 1.9888352200938996e-05, "loss": 1.6206, "step": 2790 }, { "epoch": 0.08, "learning_rate": 1.988822035908875e-05, "loss": 1.5723, "step": 2791 }, { "epoch": 0.08, "learning_rate": 1.988808843987772e-05, "loss": 1.5503, "step": 2792 }, { "epoch": 0.08, "learning_rate": 1.988795644330693e-05, "loss": 1.5693, "step": 2793 }, { "epoch": 0.08, "learning_rate": 1.9887824369377423e-05, "loss": 1.4373, "step": 2794 }, { "epoch": 0.08, "learning_rate": 1.9887692218090226e-05, "loss": 1.6533, "step": 2795 }, { "epoch": 0.08, "learning_rate": 1.9887559989446376e-05, "loss": 1.4131, "step": 2796 }, { "epoch": 0.08, "learning_rate": 1.9887427683446907e-05, "loss": 1.5359, "step": 2797 }, { "epoch": 0.08, "learning_rate": 1.9887295300092848e-05, "loss": 1.416, "step": 2798 }, { "epoch": 0.08, "learning_rate": 1.9887162839385247e-05, "loss": 1.5229, "step": 2799 }, { "epoch": 0.08, "learning_rate": 1.9887030301325127e-05, "loss": 1.3369, "step": 2800 }, { "epoch": 0.08, "learning_rate": 1.9886897685913534e-05, "loss": 1.5552, "step": 2801 }, { "epoch": 0.08, "learning_rate": 1.9886764993151503e-05, "loss": 1.5635, "step": 2802 }, { "epoch": 0.08, "learning_rate": 1.988663222304007e-05, "loss": 1.6504, "step": 2803 }, { "epoch": 0.08, "learning_rate": 1.9886499375580278e-05, "loss": 1.4912, "step": 2804 }, { "epoch": 0.08, "learning_rate": 1.9886366450773164e-05, "loss": 1.4307, "step": 2805 }, { "epoch": 0.08, "learning_rate": 1.9886233448619765e-05, "loss": 1.4763, "step": 2806 }, { "epoch": 0.08, "learning_rate": 1.9886100369121125e-05, "loss": 1.5684, "step": 2807 }, { "epoch": 0.08, "learning_rate": 1.9885967212278287e-05, "loss": 1.3733, "step": 2808 }, { "epoch": 0.08, "learning_rate": 1.9885833978092287e-05, "loss": 1.5293, "step": 2809 }, { "epoch": 0.08, "learning_rate": 1.988570066656417e-05, "loss": 1.5107, "step": 2810 }, { "epoch": 0.08, "learning_rate": 1.9885567277694983e-05, "loss": 1.5796, "step": 2811 }, { "epoch": 0.08, "learning_rate": 1.9885433811485764e-05, "loss": 1.5117, "step": 2812 }, { "epoch": 0.08, "learning_rate": 1.988530026793756e-05, "loss": 1.4734, "step": 2813 }, { "epoch": 0.08, "learning_rate": 1.9885166647051414e-05, "loss": 1.4038, "step": 2814 }, { "epoch": 0.08, "learning_rate": 1.9885032948828375e-05, "loss": 1.3845, "step": 2815 }, { "epoch": 0.08, "learning_rate": 1.9884899173269484e-05, "loss": 1.5508, "step": 2816 }, { "epoch": 0.08, "learning_rate": 1.9884765320375793e-05, "loss": 1.5591, "step": 2817 }, { "epoch": 0.08, "learning_rate": 1.9884631390148343e-05, "loss": 1.4414, "step": 2818 }, { "epoch": 0.08, "learning_rate": 1.9884497382588185e-05, "loss": 1.438, "step": 2819 }, { "epoch": 0.08, "learning_rate": 1.988436329769637e-05, "loss": 1.5449, "step": 2820 }, { "epoch": 0.08, "learning_rate": 1.9884229135473943e-05, "loss": 1.5483, "step": 2821 }, { "epoch": 0.08, "learning_rate": 1.9884094895921956e-05, "loss": 1.4976, "step": 2822 }, { "epoch": 0.08, "learning_rate": 1.988396057904146e-05, "loss": 1.3948, "step": 2823 }, { "epoch": 0.08, "learning_rate": 1.98838261848335e-05, "loss": 1.5176, "step": 2824 }, { "epoch": 0.08, "learning_rate": 1.9883691713299133e-05, "loss": 1.4316, "step": 2825 }, { "epoch": 0.08, "learning_rate": 1.988355716443941e-05, "loss": 1.5161, "step": 2826 }, { "epoch": 0.08, "learning_rate": 1.9883422538255384e-05, "loss": 1.5569, "step": 2827 }, { "epoch": 0.08, "learning_rate": 1.9883287834748108e-05, "loss": 1.4917, "step": 2828 }, { "epoch": 0.08, "learning_rate": 1.9883153053918636e-05, "loss": 1.4727, "step": 2829 }, { "epoch": 0.08, "learning_rate": 1.9883018195768022e-05, "loss": 1.3926, "step": 2830 }, { "epoch": 0.08, "learning_rate": 1.9882883260297317e-05, "loss": 1.5366, "step": 2831 }, { "epoch": 0.08, "learning_rate": 1.9882748247507584e-05, "loss": 1.5508, "step": 2832 }, { "epoch": 0.08, "learning_rate": 1.9882613157399874e-05, "loss": 1.5071, "step": 2833 }, { "epoch": 0.08, "learning_rate": 1.9882477989975248e-05, "loss": 1.6414, "step": 2834 }, { "epoch": 0.08, "learning_rate": 1.9882342745234758e-05, "loss": 1.4961, "step": 2835 }, { "epoch": 0.08, "learning_rate": 1.988220742317947e-05, "loss": 1.4868, "step": 2836 }, { "epoch": 0.08, "learning_rate": 1.9882072023810436e-05, "loss": 1.4722, "step": 2837 }, { "epoch": 0.08, "learning_rate": 1.9881936547128717e-05, "loss": 1.5225, "step": 2838 }, { "epoch": 0.08, "learning_rate": 1.9881800993135373e-05, "loss": 1.8691, "step": 2839 }, { "epoch": 0.08, "learning_rate": 1.9881665361831466e-05, "loss": 1.584, "step": 2840 }, { "epoch": 0.08, "learning_rate": 1.9881529653218052e-05, "loss": 1.5164, "step": 2841 }, { "epoch": 0.08, "learning_rate": 1.98813938672962e-05, "loss": 1.5396, "step": 2842 }, { "epoch": 0.08, "learning_rate": 1.988125800406697e-05, "loss": 1.5093, "step": 2843 }, { "epoch": 0.08, "learning_rate": 1.988112206353142e-05, "loss": 1.3611, "step": 2844 }, { "epoch": 0.08, "learning_rate": 1.988098604569062e-05, "loss": 1.6074, "step": 2845 }, { "epoch": 0.08, "learning_rate": 1.9880849950545634e-05, "loss": 1.2783, "step": 2846 }, { "epoch": 0.08, "learning_rate": 1.9880713778097523e-05, "loss": 1.4673, "step": 2847 }, { "epoch": 0.08, "learning_rate": 1.9880577528347353e-05, "loss": 1.4214, "step": 2848 }, { "epoch": 0.08, "learning_rate": 1.9880441201296186e-05, "loss": 1.4321, "step": 2849 }, { "epoch": 0.08, "learning_rate": 1.9880304796945098e-05, "loss": 1.3206, "step": 2850 }, { "epoch": 0.08, "learning_rate": 1.9880168315295152e-05, "loss": 1.6187, "step": 2851 }, { "epoch": 0.08, "learning_rate": 1.9880031756347412e-05, "loss": 1.5005, "step": 2852 }, { "epoch": 0.08, "learning_rate": 1.987989512010295e-05, "loss": 1.5493, "step": 2853 }, { "epoch": 0.08, "learning_rate": 1.9879758406562836e-05, "loss": 1.4141, "step": 2854 }, { "epoch": 0.08, "learning_rate": 1.9879621615728137e-05, "loss": 1.4995, "step": 2855 }, { "epoch": 0.08, "learning_rate": 1.9879484747599927e-05, "loss": 1.3994, "step": 2856 }, { "epoch": 0.08, "learning_rate": 1.987934780217927e-05, "loss": 1.3318, "step": 2857 }, { "epoch": 0.08, "learning_rate": 1.987921077946724e-05, "loss": 1.5059, "step": 2858 }, { "epoch": 0.08, "learning_rate": 1.9879073679464914e-05, "loss": 1.5547, "step": 2859 }, { "epoch": 0.08, "learning_rate": 1.987893650217336e-05, "loss": 1.3503, "step": 2860 }, { "epoch": 0.08, "learning_rate": 1.9878799247593654e-05, "loss": 1.4731, "step": 2861 }, { "epoch": 0.08, "learning_rate": 1.9878661915726865e-05, "loss": 1.4976, "step": 2862 }, { "epoch": 0.08, "learning_rate": 1.9878524506574073e-05, "loss": 1.8125, "step": 2863 }, { "epoch": 0.08, "learning_rate": 1.987838702013635e-05, "loss": 1.5806, "step": 2864 }, { "epoch": 0.08, "learning_rate": 1.9878249456414772e-05, "loss": 1.4819, "step": 2865 }, { "epoch": 0.08, "learning_rate": 1.9878111815410414e-05, "loss": 1.5425, "step": 2866 }, { "epoch": 0.08, "learning_rate": 1.9877974097124356e-05, "loss": 1.5317, "step": 2867 }, { "epoch": 0.08, "learning_rate": 1.987783630155767e-05, "loss": 1.4573, "step": 2868 }, { "epoch": 0.08, "learning_rate": 1.9877698428711444e-05, "loss": 1.8257, "step": 2869 }, { "epoch": 0.08, "learning_rate": 1.9877560478586746e-05, "loss": 1.6597, "step": 2870 }, { "epoch": 0.08, "learning_rate": 1.987742245118466e-05, "loss": 1.4241, "step": 2871 }, { "epoch": 0.08, "learning_rate": 1.9877284346506264e-05, "loss": 1.3523, "step": 2872 }, { "epoch": 0.08, "learning_rate": 1.9877146164552642e-05, "loss": 1.5046, "step": 2873 }, { "epoch": 0.08, "learning_rate": 1.9877007905324876e-05, "loss": 1.5171, "step": 2874 }, { "epoch": 0.08, "learning_rate": 1.987686956882404e-05, "loss": 1.4937, "step": 2875 }, { "epoch": 0.08, "learning_rate": 1.987673115505122e-05, "loss": 1.6348, "step": 2876 }, { "epoch": 0.08, "learning_rate": 1.9876592664007505e-05, "loss": 1.302, "step": 2877 }, { "epoch": 0.08, "learning_rate": 1.987645409569397e-05, "loss": 1.5264, "step": 2878 }, { "epoch": 0.08, "learning_rate": 1.98763154501117e-05, "loss": 1.4463, "step": 2879 }, { "epoch": 0.08, "learning_rate": 1.9876176727261786e-05, "loss": 1.4709, "step": 2880 }, { "epoch": 0.08, "learning_rate": 1.9876037927145305e-05, "loss": 1.563, "step": 2881 }, { "epoch": 0.08, "learning_rate": 1.9875899049763353e-05, "loss": 1.5122, "step": 2882 }, { "epoch": 0.08, "learning_rate": 1.9875760095117007e-05, "loss": 1.4829, "step": 2883 }, { "epoch": 0.08, "learning_rate": 1.987562106320736e-05, "loss": 1.522, "step": 2884 }, { "epoch": 0.08, "learning_rate": 1.9875481954035497e-05, "loss": 1.8071, "step": 2885 }, { "epoch": 0.08, "learning_rate": 1.9875342767602505e-05, "loss": 1.5244, "step": 2886 }, { "epoch": 0.08, "learning_rate": 1.9875203503909476e-05, "loss": 1.5352, "step": 2887 }, { "epoch": 0.08, "learning_rate": 1.98750641629575e-05, "loss": 1.4985, "step": 2888 }, { "epoch": 0.08, "learning_rate": 1.9874924744747665e-05, "loss": 1.46, "step": 2889 }, { "epoch": 0.08, "learning_rate": 1.987478524928106e-05, "loss": 1.4214, "step": 2890 }, { "epoch": 0.08, "learning_rate": 1.9874645676558782e-05, "loss": 1.5874, "step": 2891 }, { "epoch": 0.08, "learning_rate": 1.987450602658192e-05, "loss": 1.5659, "step": 2892 }, { "epoch": 0.08, "learning_rate": 1.9874366299351565e-05, "loss": 1.5542, "step": 2893 }, { "epoch": 0.08, "learning_rate": 1.987422649486881e-05, "loss": 1.4634, "step": 2894 }, { "epoch": 0.08, "learning_rate": 1.987408661313475e-05, "loss": 1.4023, "step": 2895 }, { "epoch": 0.08, "learning_rate": 1.987394665415048e-05, "loss": 1.3162, "step": 2896 }, { "epoch": 0.08, "learning_rate": 1.9873806617917094e-05, "loss": 1.4829, "step": 2897 }, { "epoch": 0.08, "learning_rate": 1.987366650443569e-05, "loss": 1.5403, "step": 2898 }, { "epoch": 0.08, "learning_rate": 1.987352631370736e-05, "loss": 1.4089, "step": 2899 }, { "epoch": 0.08, "learning_rate": 1.9873386045733203e-05, "loss": 1.5229, "step": 2900 }, { "epoch": 0.08, "learning_rate": 1.9873245700514317e-05, "loss": 1.5283, "step": 2901 }, { "epoch": 0.08, "learning_rate": 1.98731052780518e-05, "loss": 1.4377, "step": 2902 }, { "epoch": 0.08, "learning_rate": 1.987296477834675e-05, "loss": 1.4712, "step": 2903 }, { "epoch": 0.08, "learning_rate": 1.9872824201400263e-05, "loss": 1.2903, "step": 2904 }, { "epoch": 0.08, "learning_rate": 1.9872683547213446e-05, "loss": 1.5166, "step": 2905 }, { "epoch": 0.08, "learning_rate": 1.9872542815787397e-05, "loss": 1.3827, "step": 2906 }, { "epoch": 0.08, "learning_rate": 1.987240200712321e-05, "loss": 1.5364, "step": 2907 }, { "epoch": 0.08, "learning_rate": 1.9872261121221995e-05, "loss": 1.6304, "step": 2908 }, { "epoch": 0.08, "learning_rate": 1.9872120158084853e-05, "loss": 1.5913, "step": 2909 }, { "epoch": 0.08, "learning_rate": 1.987197911771288e-05, "loss": 1.582, "step": 2910 }, { "epoch": 0.08, "learning_rate": 1.987183800010719e-05, "loss": 1.5134, "step": 2911 }, { "epoch": 0.08, "learning_rate": 1.9871696805268877e-05, "loss": 1.5811, "step": 2912 }, { "epoch": 0.08, "learning_rate": 1.9871555533199053e-05, "loss": 1.457, "step": 2913 }, { "epoch": 0.08, "learning_rate": 1.9871414183898817e-05, "loss": 1.3059, "step": 2914 }, { "epoch": 0.08, "learning_rate": 1.9871272757369283e-05, "loss": 1.4788, "step": 2915 }, { "epoch": 0.08, "learning_rate": 1.987113125361155e-05, "loss": 1.3821, "step": 2916 }, { "epoch": 0.08, "learning_rate": 1.987098967262673e-05, "loss": 1.5371, "step": 2917 }, { "epoch": 0.08, "learning_rate": 1.9870848014415926e-05, "loss": 1.5356, "step": 2918 }, { "epoch": 0.08, "learning_rate": 1.987070627898025e-05, "loss": 1.502, "step": 2919 }, { "epoch": 0.08, "learning_rate": 1.9870564466320807e-05, "loss": 1.5417, "step": 2920 }, { "epoch": 0.08, "learning_rate": 1.9870422576438713e-05, "loss": 1.5405, "step": 2921 }, { "epoch": 0.08, "learning_rate": 1.9870280609335072e-05, "loss": 1.4036, "step": 2922 }, { "epoch": 0.08, "learning_rate": 1.9870138565011e-05, "loss": 1.6196, "step": 2923 }, { "epoch": 0.08, "learning_rate": 1.98699964434676e-05, "loss": 1.5249, "step": 2924 }, { "epoch": 0.08, "learning_rate": 1.986985424470599e-05, "loss": 1.4547, "step": 2925 }, { "epoch": 0.08, "learning_rate": 1.9869711968727286e-05, "loss": 1.3362, "step": 2926 }, { "epoch": 0.08, "learning_rate": 1.986956961553259e-05, "loss": 1.502, "step": 2927 }, { "epoch": 0.08, "learning_rate": 1.9869427185123025e-05, "loss": 1.6602, "step": 2928 }, { "epoch": 0.08, "learning_rate": 1.986928467749971e-05, "loss": 1.5569, "step": 2929 }, { "epoch": 0.08, "learning_rate": 1.986914209266374e-05, "loss": 1.4653, "step": 2930 }, { "epoch": 0.08, "learning_rate": 1.9868999430616253e-05, "loss": 1.428, "step": 2931 }, { "epoch": 0.08, "learning_rate": 1.986885669135835e-05, "loss": 1.5884, "step": 2932 }, { "epoch": 0.08, "learning_rate": 1.9868713874891153e-05, "loss": 1.5059, "step": 2933 }, { "epoch": 0.08, "learning_rate": 1.9868570981215783e-05, "loss": 1.5278, "step": 2934 }, { "epoch": 0.08, "learning_rate": 1.9868428010333352e-05, "loss": 1.6533, "step": 2935 }, { "epoch": 0.08, "learning_rate": 1.9868284962244977e-05, "loss": 1.3569, "step": 2936 }, { "epoch": 0.08, "learning_rate": 1.9868141836951787e-05, "loss": 1.4133, "step": 2937 }, { "epoch": 0.08, "learning_rate": 1.986799863445489e-05, "loss": 1.5801, "step": 2938 }, { "epoch": 0.08, "learning_rate": 1.9867855354755417e-05, "loss": 1.3843, "step": 2939 }, { "epoch": 0.08, "learning_rate": 1.9867711997854478e-05, "loss": 1.4392, "step": 2940 }, { "epoch": 0.08, "learning_rate": 1.986756856375321e-05, "loss": 1.5586, "step": 2941 }, { "epoch": 0.08, "learning_rate": 1.9867425052452716e-05, "loss": 1.603, "step": 2942 }, { "epoch": 0.08, "learning_rate": 1.986728146395413e-05, "loss": 1.324, "step": 2943 }, { "epoch": 0.08, "learning_rate": 1.9867137798258577e-05, "loss": 1.5342, "step": 2944 }, { "epoch": 0.08, "learning_rate": 1.9866994055367178e-05, "loss": 1.4714, "step": 2945 }, { "epoch": 0.08, "learning_rate": 1.9866850235281054e-05, "loss": 1.7451, "step": 2946 }, { "epoch": 0.08, "learning_rate": 1.9866706338001336e-05, "loss": 1.3379, "step": 2947 }, { "epoch": 0.08, "learning_rate": 1.9866562363529146e-05, "loss": 1.2351, "step": 2948 }, { "epoch": 0.08, "learning_rate": 1.9866418311865614e-05, "loss": 1.668, "step": 2949 }, { "epoch": 0.08, "learning_rate": 1.9866274183011862e-05, "loss": 1.3917, "step": 2950 }, { "epoch": 0.08, "learning_rate": 1.9866129976969023e-05, "loss": 1.7754, "step": 2951 }, { "epoch": 0.08, "learning_rate": 1.986598569373822e-05, "loss": 1.5918, "step": 2952 }, { "epoch": 0.08, "learning_rate": 1.9865841333320585e-05, "loss": 1.3628, "step": 2953 }, { "epoch": 0.08, "learning_rate": 1.9865696895717244e-05, "loss": 1.3184, "step": 2954 }, { "epoch": 0.08, "learning_rate": 1.9865552380929335e-05, "loss": 1.5217, "step": 2955 }, { "epoch": 0.08, "learning_rate": 1.986540778895798e-05, "loss": 1.5063, "step": 2956 }, { "epoch": 0.08, "learning_rate": 1.9865263119804313e-05, "loss": 1.4944, "step": 2957 }, { "epoch": 0.08, "learning_rate": 1.9865118373469467e-05, "loss": 1.5713, "step": 2958 }, { "epoch": 0.08, "learning_rate": 1.9864973549954576e-05, "loss": 1.5271, "step": 2959 }, { "epoch": 0.08, "learning_rate": 1.986482864926077e-05, "loss": 1.4111, "step": 2960 }, { "epoch": 0.08, "learning_rate": 1.986468367138918e-05, "loss": 1.4214, "step": 2961 }, { "epoch": 0.08, "learning_rate": 1.9864538616340946e-05, "loss": 1.4373, "step": 2962 }, { "epoch": 0.08, "learning_rate": 1.98643934841172e-05, "loss": 1.3911, "step": 2963 }, { "epoch": 0.08, "learning_rate": 1.9864248274719077e-05, "loss": 1.5288, "step": 2964 }, { "epoch": 0.08, "learning_rate": 1.9864102988147715e-05, "loss": 1.3931, "step": 2965 }, { "epoch": 0.08, "learning_rate": 1.986395762440425e-05, "loss": 1.4092, "step": 2966 }, { "epoch": 0.08, "learning_rate": 1.986381218348982e-05, "loss": 1.3401, "step": 2967 }, { "epoch": 0.08, "learning_rate": 1.986366666540556e-05, "loss": 1.4382, "step": 2968 }, { "epoch": 0.08, "learning_rate": 1.986352107015261e-05, "loss": 1.4604, "step": 2969 }, { "epoch": 0.08, "learning_rate": 1.986337539773211e-05, "loss": 1.4929, "step": 2970 }, { "epoch": 0.08, "learning_rate": 1.9863229648145202e-05, "loss": 1.415, "step": 2971 }, { "epoch": 0.08, "learning_rate": 1.986308382139302e-05, "loss": 1.4639, "step": 2972 }, { "epoch": 0.08, "learning_rate": 1.9862937917476707e-05, "loss": 1.5752, "step": 2973 }, { "epoch": 0.08, "learning_rate": 1.9862791936397408e-05, "loss": 1.3755, "step": 2974 }, { "epoch": 0.08, "learning_rate": 1.986264587815626e-05, "loss": 1.3813, "step": 2975 }, { "epoch": 0.08, "learning_rate": 1.9862499742754412e-05, "loss": 1.3562, "step": 2976 }, { "epoch": 0.08, "learning_rate": 1.9862353530193002e-05, "loss": 1.5166, "step": 2977 }, { "epoch": 0.08, "learning_rate": 1.9862207240473176e-05, "loss": 1.5732, "step": 2978 }, { "epoch": 0.08, "learning_rate": 1.9862060873596075e-05, "loss": 1.5229, "step": 2979 }, { "epoch": 0.08, "learning_rate": 1.986191442956285e-05, "loss": 1.3865, "step": 2980 }, { "epoch": 0.08, "learning_rate": 1.9861767908374646e-05, "loss": 1.3845, "step": 2981 }, { "epoch": 0.08, "learning_rate": 1.9861621310032602e-05, "loss": 1.4229, "step": 2982 }, { "epoch": 0.08, "learning_rate": 1.9861474634537875e-05, "loss": 1.4548, "step": 2983 }, { "epoch": 0.08, "learning_rate": 1.9861327881891605e-05, "loss": 1.3896, "step": 2984 }, { "epoch": 0.08, "learning_rate": 1.9861181052094946e-05, "loss": 1.3564, "step": 2985 }, { "epoch": 0.08, "learning_rate": 1.9861034145149038e-05, "loss": 1.553, "step": 2986 }, { "epoch": 0.08, "learning_rate": 1.986088716105504e-05, "loss": 1.3589, "step": 2987 }, { "epoch": 0.08, "learning_rate": 1.9860740099814095e-05, "loss": 1.2065, "step": 2988 }, { "epoch": 0.08, "learning_rate": 1.9860592961427358e-05, "loss": 1.52, "step": 2989 }, { "epoch": 0.08, "learning_rate": 1.986044574589598e-05, "loss": 1.5435, "step": 2990 }, { "epoch": 0.08, "learning_rate": 1.986029845322111e-05, "loss": 1.4624, "step": 2991 }, { "epoch": 0.08, "learning_rate": 1.98601510834039e-05, "loss": 1.4924, "step": 2992 }, { "epoch": 0.08, "learning_rate": 1.9860003636445504e-05, "loss": 1.5879, "step": 2993 }, { "epoch": 0.08, "learning_rate": 1.9859856112347078e-05, "loss": 1.4229, "step": 2994 }, { "epoch": 0.08, "learning_rate": 1.9859708511109774e-05, "loss": 1.6191, "step": 2995 }, { "epoch": 0.08, "learning_rate": 1.985956083273475e-05, "loss": 1.647, "step": 2996 }, { "epoch": 0.08, "learning_rate": 1.9859413077223154e-05, "loss": 1.6123, "step": 2997 }, { "epoch": 0.08, "learning_rate": 1.9859265244576144e-05, "loss": 1.4402, "step": 2998 }, { "epoch": 0.08, "learning_rate": 1.9859117334794883e-05, "loss": 1.3589, "step": 2999 }, { "epoch": 0.08, "learning_rate": 1.9858969347880524e-05, "loss": 1.3672, "step": 3000 }, { "epoch": 0.08, "learning_rate": 1.9858821283834223e-05, "loss": 1.4094, "step": 3001 }, { "epoch": 0.08, "learning_rate": 1.9858673142657143e-05, "loss": 1.4531, "step": 3002 }, { "epoch": 0.08, "learning_rate": 1.985852492435044e-05, "loss": 1.5652, "step": 3003 }, { "epoch": 0.08, "learning_rate": 1.985837662891527e-05, "loss": 1.4922, "step": 3004 }, { "epoch": 0.08, "learning_rate": 1.98582282563528e-05, "loss": 1.5569, "step": 3005 }, { "epoch": 0.08, "learning_rate": 1.985807980666419e-05, "loss": 1.3992, "step": 3006 }, { "epoch": 0.08, "learning_rate": 1.9857931279850592e-05, "loss": 1.4819, "step": 3007 }, { "epoch": 0.08, "learning_rate": 1.985778267591318e-05, "loss": 1.4148, "step": 3008 }, { "epoch": 0.08, "learning_rate": 1.985763399485311e-05, "loss": 1.4783, "step": 3009 }, { "epoch": 0.08, "learning_rate": 1.985748523667155e-05, "loss": 1.3149, "step": 3010 }, { "epoch": 0.08, "learning_rate": 1.985733640136966e-05, "loss": 1.5793, "step": 3011 }, { "epoch": 0.08, "learning_rate": 1.9857187488948605e-05, "loss": 1.5046, "step": 3012 }, { "epoch": 0.08, "learning_rate": 1.985703849940955e-05, "loss": 1.5625, "step": 3013 }, { "epoch": 0.08, "learning_rate": 1.985688943275366e-05, "loss": 1.6421, "step": 3014 }, { "epoch": 0.08, "learning_rate": 1.98567402889821e-05, "loss": 1.4316, "step": 3015 }, { "epoch": 0.08, "learning_rate": 1.9856591068096042e-05, "loss": 1.4536, "step": 3016 }, { "epoch": 0.08, "learning_rate": 1.985644177009665e-05, "loss": 1.5115, "step": 3017 }, { "epoch": 0.08, "learning_rate": 1.9856292394985093e-05, "loss": 1.5249, "step": 3018 }, { "epoch": 0.08, "learning_rate": 1.9856142942762537e-05, "loss": 1.4817, "step": 3019 }, { "epoch": 0.08, "learning_rate": 1.9855993413430156e-05, "loss": 1.438, "step": 3020 }, { "epoch": 0.08, "learning_rate": 1.9855843806989117e-05, "loss": 1.4231, "step": 3021 }, { "epoch": 0.08, "learning_rate": 1.985569412344059e-05, "loss": 1.603, "step": 3022 }, { "epoch": 0.08, "learning_rate": 1.9855544362785743e-05, "loss": 1.4763, "step": 3023 }, { "epoch": 0.08, "learning_rate": 1.9855394525025756e-05, "loss": 1.5801, "step": 3024 }, { "epoch": 0.08, "learning_rate": 1.9855244610161796e-05, "loss": 1.4045, "step": 3025 }, { "epoch": 0.08, "learning_rate": 1.9855094618195036e-05, "loss": 1.5693, "step": 3026 }, { "epoch": 0.08, "learning_rate": 1.9854944549126647e-05, "loss": 1.3879, "step": 3027 }, { "epoch": 0.08, "learning_rate": 1.985479440295781e-05, "loss": 1.3506, "step": 3028 }, { "epoch": 0.08, "learning_rate": 1.9854644179689693e-05, "loss": 1.5781, "step": 3029 }, { "epoch": 0.08, "learning_rate": 1.9854493879323475e-05, "loss": 1.3933, "step": 3030 }, { "epoch": 0.08, "learning_rate": 1.985434350186033e-05, "loss": 1.3416, "step": 3031 }, { "epoch": 0.08, "learning_rate": 1.9854193047301438e-05, "loss": 1.4282, "step": 3032 }, { "epoch": 0.08, "learning_rate": 1.985404251564797e-05, "loss": 1.5151, "step": 3033 }, { "epoch": 0.08, "learning_rate": 1.985389190690111e-05, "loss": 1.3386, "step": 3034 }, { "epoch": 0.08, "learning_rate": 1.985374122106203e-05, "loss": 1.3962, "step": 3035 }, { "epoch": 0.08, "learning_rate": 1.9853590458131913e-05, "loss": 1.5588, "step": 3036 }, { "epoch": 0.08, "learning_rate": 1.985343961811194e-05, "loss": 1.3643, "step": 3037 }, { "epoch": 0.08, "learning_rate": 1.9853288701003287e-05, "loss": 1.3333, "step": 3038 }, { "epoch": 0.08, "learning_rate": 1.9853137706807137e-05, "loss": 1.5962, "step": 3039 }, { "epoch": 0.08, "learning_rate": 1.9852986635524673e-05, "loss": 1.5771, "step": 3040 }, { "epoch": 0.08, "learning_rate": 1.985283548715707e-05, "loss": 1.6594, "step": 3041 }, { "epoch": 0.08, "learning_rate": 1.985268426170552e-05, "loss": 1.4841, "step": 3042 }, { "epoch": 0.08, "learning_rate": 1.98525329591712e-05, "loss": 1.4434, "step": 3043 }, { "epoch": 0.08, "learning_rate": 1.9852381579555292e-05, "loss": 1.4333, "step": 3044 }, { "epoch": 0.08, "learning_rate": 1.9852230122858986e-05, "loss": 1.4189, "step": 3045 }, { "epoch": 0.08, "learning_rate": 1.9852078589083465e-05, "loss": 1.4026, "step": 3046 }, { "epoch": 0.08, "learning_rate": 1.9851926978229914e-05, "loss": 1.4814, "step": 3047 }, { "epoch": 0.08, "learning_rate": 1.9851775290299516e-05, "loss": 1.5479, "step": 3048 }, { "epoch": 0.08, "learning_rate": 1.9851623525293463e-05, "loss": 1.5708, "step": 3049 }, { "epoch": 0.08, "learning_rate": 1.9851471683212942e-05, "loss": 1.5259, "step": 3050 }, { "epoch": 0.08, "learning_rate": 1.9851319764059137e-05, "loss": 1.5864, "step": 3051 }, { "epoch": 0.08, "learning_rate": 1.9851167767833236e-05, "loss": 1.5366, "step": 3052 }, { "epoch": 0.08, "learning_rate": 1.9851015694536437e-05, "loss": 1.4585, "step": 3053 }, { "epoch": 0.08, "learning_rate": 1.985086354416992e-05, "loss": 1.4958, "step": 3054 }, { "epoch": 0.08, "learning_rate": 1.985071131673488e-05, "loss": 1.5366, "step": 3055 }, { "epoch": 0.08, "learning_rate": 1.9850559012232505e-05, "loss": 1.6504, "step": 3056 }, { "epoch": 0.08, "learning_rate": 1.9850406630663987e-05, "loss": 1.4854, "step": 3057 }, { "epoch": 0.08, "learning_rate": 1.985025417203052e-05, "loss": 1.5571, "step": 3058 }, { "epoch": 0.08, "learning_rate": 1.98501016363333e-05, "loss": 1.3125, "step": 3059 }, { "epoch": 0.08, "learning_rate": 1.984994902357351e-05, "loss": 1.418, "step": 3060 }, { "epoch": 0.08, "learning_rate": 1.9849796333752357e-05, "loss": 1.5664, "step": 3061 }, { "epoch": 0.08, "learning_rate": 1.9849643566871028e-05, "loss": 1.6211, "step": 3062 }, { "epoch": 0.08, "learning_rate": 1.984949072293072e-05, "loss": 1.4202, "step": 3063 }, { "epoch": 0.08, "learning_rate": 1.9849337801932625e-05, "loss": 1.6963, "step": 3064 }, { "epoch": 0.08, "learning_rate": 1.9849184803877946e-05, "loss": 1.3301, "step": 3065 }, { "epoch": 0.08, "learning_rate": 1.9849031728767873e-05, "loss": 1.6086, "step": 3066 }, { "epoch": 0.08, "learning_rate": 1.9848878576603607e-05, "loss": 1.5322, "step": 3067 }, { "epoch": 0.08, "learning_rate": 1.9848725347386352e-05, "loss": 1.5479, "step": 3068 }, { "epoch": 0.08, "learning_rate": 1.9848572041117292e-05, "loss": 1.646, "step": 3069 }, { "epoch": 0.08, "learning_rate": 1.9848418657797642e-05, "loss": 1.5435, "step": 3070 }, { "epoch": 0.08, "learning_rate": 1.9848265197428596e-05, "loss": 1.5317, "step": 3071 }, { "epoch": 0.08, "learning_rate": 1.984811166001135e-05, "loss": 1.4875, "step": 3072 }, { "epoch": 0.08, "learning_rate": 1.9847958045547112e-05, "loss": 1.5454, "step": 3073 }, { "epoch": 0.08, "learning_rate": 1.9847804354037083e-05, "loss": 1.6086, "step": 3074 }, { "epoch": 0.08, "learning_rate": 1.9847650585482458e-05, "loss": 1.4148, "step": 3075 }, { "epoch": 0.08, "learning_rate": 1.984749673988445e-05, "loss": 1.3738, "step": 3076 }, { "epoch": 0.08, "learning_rate": 1.9847342817244256e-05, "loss": 1.3826, "step": 3077 }, { "epoch": 0.08, "learning_rate": 1.984718881756308e-05, "loss": 1.4102, "step": 3078 }, { "epoch": 0.08, "learning_rate": 1.9847034740842136e-05, "loss": 1.4648, "step": 3079 }, { "epoch": 0.08, "learning_rate": 1.984688058708262e-05, "loss": 1.4902, "step": 3080 }, { "epoch": 0.08, "learning_rate": 1.9846726356285736e-05, "loss": 1.5234, "step": 3081 }, { "epoch": 0.08, "learning_rate": 1.9846572048452698e-05, "loss": 1.4656, "step": 3082 }, { "epoch": 0.08, "learning_rate": 1.9846417663584713e-05, "loss": 1.6392, "step": 3083 }, { "epoch": 0.08, "learning_rate": 1.9846263201682982e-05, "loss": 1.4727, "step": 3084 }, { "epoch": 0.08, "learning_rate": 1.984610866274872e-05, "loss": 1.4768, "step": 3085 }, { "epoch": 0.08, "learning_rate": 1.9845954046783134e-05, "loss": 1.3914, "step": 3086 }, { "epoch": 0.08, "learning_rate": 1.9845799353787437e-05, "loss": 1.4756, "step": 3087 }, { "epoch": 0.08, "learning_rate": 1.984564458376283e-05, "loss": 1.4592, "step": 3088 }, { "epoch": 0.08, "learning_rate": 1.984548973671053e-05, "loss": 1.4631, "step": 3089 }, { "epoch": 0.08, "learning_rate": 1.9845334812631752e-05, "loss": 1.5015, "step": 3090 }, { "epoch": 0.08, "learning_rate": 1.9845179811527698e-05, "loss": 1.5823, "step": 3091 }, { "epoch": 0.08, "learning_rate": 1.9845024733399594e-05, "loss": 1.5664, "step": 3092 }, { "epoch": 0.08, "learning_rate": 1.984486957824864e-05, "loss": 1.6265, "step": 3093 }, { "epoch": 0.08, "learning_rate": 1.9844714346076058e-05, "loss": 1.4452, "step": 3094 }, { "epoch": 0.08, "learning_rate": 1.984455903688306e-05, "loss": 1.4641, "step": 3095 }, { "epoch": 0.08, "learning_rate": 1.9844403650670863e-05, "loss": 1.5857, "step": 3096 }, { "epoch": 0.08, "learning_rate": 1.984424818744068e-05, "loss": 1.5449, "step": 3097 }, { "epoch": 0.08, "learning_rate": 1.9844092647193728e-05, "loss": 1.4243, "step": 3098 }, { "epoch": 0.08, "learning_rate": 1.9843937029931223e-05, "loss": 1.3535, "step": 3099 }, { "epoch": 0.08, "learning_rate": 1.9843781335654386e-05, "loss": 1.4631, "step": 3100 }, { "epoch": 0.08, "learning_rate": 1.984362556436443e-05, "loss": 1.4771, "step": 3101 }, { "epoch": 0.08, "learning_rate": 1.9843469716062578e-05, "loss": 1.5837, "step": 3102 }, { "epoch": 0.08, "learning_rate": 1.9843313790750046e-05, "loss": 1.5742, "step": 3103 }, { "epoch": 0.08, "learning_rate": 1.9843157788428055e-05, "loss": 1.8159, "step": 3104 }, { "epoch": 0.08, "learning_rate": 1.9843001709097832e-05, "loss": 1.519, "step": 3105 }, { "epoch": 0.08, "learning_rate": 1.9842845552760585e-05, "loss": 1.5298, "step": 3106 }, { "epoch": 0.08, "learning_rate": 1.9842689319417546e-05, "loss": 1.3772, "step": 3107 }, { "epoch": 0.08, "learning_rate": 1.9842533009069936e-05, "loss": 1.4341, "step": 3108 }, { "epoch": 0.08, "learning_rate": 1.9842376621718974e-05, "loss": 1.4214, "step": 3109 }, { "epoch": 0.08, "learning_rate": 1.9842220157365887e-05, "loss": 1.5073, "step": 3110 }, { "epoch": 0.08, "learning_rate": 1.9842063616011893e-05, "loss": 1.5317, "step": 3111 }, { "epoch": 0.08, "learning_rate": 1.9841906997658225e-05, "loss": 1.6128, "step": 3112 }, { "epoch": 0.09, "learning_rate": 1.9841750302306103e-05, "loss": 1.4971, "step": 3113 }, { "epoch": 0.09, "learning_rate": 1.9841593529956756e-05, "loss": 1.4907, "step": 3114 }, { "epoch": 0.09, "learning_rate": 1.9841436680611408e-05, "loss": 1.6006, "step": 3115 }, { "epoch": 0.09, "learning_rate": 1.984127975427129e-05, "loss": 1.5806, "step": 3116 }, { "epoch": 0.09, "learning_rate": 1.9841122750937624e-05, "loss": 1.2927, "step": 3117 }, { "epoch": 0.09, "learning_rate": 1.984096567061164e-05, "loss": 1.4795, "step": 3118 }, { "epoch": 0.09, "learning_rate": 1.9840808513294573e-05, "loss": 1.4861, "step": 3119 }, { "epoch": 0.09, "learning_rate": 1.9840651278987642e-05, "loss": 1.3806, "step": 3120 }, { "epoch": 0.09, "learning_rate": 1.9840493967692088e-05, "loss": 1.3677, "step": 3121 }, { "epoch": 0.09, "learning_rate": 1.9840336579409132e-05, "loss": 1.4016, "step": 3122 }, { "epoch": 0.09, "learning_rate": 1.9840179114140013e-05, "loss": 1.7578, "step": 3123 }, { "epoch": 0.09, "learning_rate": 1.984002157188596e-05, "loss": 1.4951, "step": 3124 }, { "epoch": 0.09, "learning_rate": 1.9839863952648203e-05, "loss": 1.4856, "step": 3125 }, { "epoch": 0.09, "learning_rate": 1.983970625642798e-05, "loss": 1.4966, "step": 3126 }, { "epoch": 0.09, "learning_rate": 1.983954848322652e-05, "loss": 1.5381, "step": 3127 }, { "epoch": 0.09, "learning_rate": 1.983939063304506e-05, "loss": 1.4458, "step": 3128 }, { "epoch": 0.09, "learning_rate": 1.9839232705884836e-05, "loss": 1.3843, "step": 3129 }, { "epoch": 0.09, "learning_rate": 1.983907470174708e-05, "loss": 1.4749, "step": 3130 }, { "epoch": 0.09, "learning_rate": 1.9838916620633032e-05, "loss": 1.4961, "step": 3131 }, { "epoch": 0.09, "learning_rate": 1.9838758462543926e-05, "loss": 1.5854, "step": 3132 }, { "epoch": 0.09, "learning_rate": 1.9838600227480998e-05, "loss": 1.5273, "step": 3133 }, { "epoch": 0.09, "learning_rate": 1.9838441915445493e-05, "loss": 1.6069, "step": 3134 }, { "epoch": 0.09, "learning_rate": 1.983828352643864e-05, "loss": 1.272, "step": 3135 }, { "epoch": 0.09, "learning_rate": 1.9838125060461687e-05, "loss": 1.5542, "step": 3136 }, { "epoch": 0.09, "learning_rate": 1.9837966517515866e-05, "loss": 1.2726, "step": 3137 }, { "epoch": 0.09, "learning_rate": 1.9837807897602424e-05, "loss": 1.5662, "step": 3138 }, { "epoch": 0.09, "learning_rate": 1.98376492007226e-05, "loss": 1.5608, "step": 3139 }, { "epoch": 0.09, "learning_rate": 1.9837490426877633e-05, "loss": 1.7974, "step": 3140 }, { "epoch": 0.09, "learning_rate": 1.9837331576068766e-05, "loss": 1.4346, "step": 3141 }, { "epoch": 0.09, "learning_rate": 1.9837172648297246e-05, "loss": 1.5337, "step": 3142 }, { "epoch": 0.09, "learning_rate": 1.983701364356431e-05, "loss": 1.4536, "step": 3143 }, { "epoch": 0.09, "learning_rate": 1.9836854561871202e-05, "loss": 1.4785, "step": 3144 }, { "epoch": 0.09, "learning_rate": 1.9836695403219175e-05, "loss": 1.5173, "step": 3145 }, { "epoch": 0.09, "learning_rate": 1.9836536167609464e-05, "loss": 1.5901, "step": 3146 }, { "epoch": 0.09, "learning_rate": 1.9836376855043324e-05, "loss": 1.4717, "step": 3147 }, { "epoch": 0.09, "learning_rate": 1.9836217465521994e-05, "loss": 1.4326, "step": 3148 }, { "epoch": 0.09, "learning_rate": 1.9836057999046725e-05, "loss": 1.4009, "step": 3149 }, { "epoch": 0.09, "learning_rate": 1.9835898455618764e-05, "loss": 1.3613, "step": 3150 }, { "epoch": 0.09, "learning_rate": 1.9835738835239356e-05, "loss": 1.5601, "step": 3151 }, { "epoch": 0.09, "learning_rate": 1.9835579137909754e-05, "loss": 1.366, "step": 3152 }, { "epoch": 0.09, "learning_rate": 1.983541936363121e-05, "loss": 1.5876, "step": 3153 }, { "epoch": 0.09, "learning_rate": 1.9835259512404962e-05, "loss": 1.4521, "step": 3154 }, { "epoch": 0.09, "learning_rate": 1.9835099584232274e-05, "loss": 1.3657, "step": 3155 }, { "epoch": 0.09, "learning_rate": 1.983493957911439e-05, "loss": 1.4651, "step": 3156 }, { "epoch": 0.09, "learning_rate": 1.983477949705256e-05, "loss": 1.4233, "step": 3157 }, { "epoch": 0.09, "learning_rate": 1.9834619338048044e-05, "loss": 1.4465, "step": 3158 }, { "epoch": 0.09, "learning_rate": 1.9834459102102093e-05, "loss": 1.832, "step": 3159 }, { "epoch": 0.09, "learning_rate": 1.9834298789215954e-05, "loss": 1.626, "step": 3160 }, { "epoch": 0.09, "learning_rate": 1.983413839939089e-05, "loss": 1.4897, "step": 3161 }, { "epoch": 0.09, "learning_rate": 1.9833977932628148e-05, "loss": 1.4346, "step": 3162 }, { "epoch": 0.09, "learning_rate": 1.9833817388928987e-05, "loss": 1.5771, "step": 3163 }, { "epoch": 0.09, "learning_rate": 1.983365676829466e-05, "loss": 1.3857, "step": 3164 }, { "epoch": 0.09, "learning_rate": 1.9833496070726436e-05, "loss": 1.3843, "step": 3165 }, { "epoch": 0.09, "learning_rate": 1.9833335296225553e-05, "loss": 1.3955, "step": 3166 }, { "epoch": 0.09, "learning_rate": 1.9833174444793285e-05, "loss": 1.363, "step": 3167 }, { "epoch": 0.09, "learning_rate": 1.9833013516430882e-05, "loss": 1.3469, "step": 3168 }, { "epoch": 0.09, "learning_rate": 1.9832852511139603e-05, "loss": 1.4995, "step": 3169 }, { "epoch": 0.09, "learning_rate": 1.9832691428920713e-05, "loss": 1.519, "step": 3170 }, { "epoch": 0.09, "learning_rate": 1.9832530269775466e-05, "loss": 1.5598, "step": 3171 }, { "epoch": 0.09, "learning_rate": 1.9832369033705127e-05, "loss": 1.5464, "step": 3172 }, { "epoch": 0.09, "learning_rate": 1.9832207720710955e-05, "loss": 1.5229, "step": 3173 }, { "epoch": 0.09, "learning_rate": 1.9832046330794218e-05, "loss": 1.4634, "step": 3174 }, { "epoch": 0.09, "learning_rate": 1.983188486395617e-05, "loss": 1.4731, "step": 3175 }, { "epoch": 0.09, "learning_rate": 1.9831723320198076e-05, "loss": 1.5166, "step": 3176 }, { "epoch": 0.09, "learning_rate": 1.9831561699521206e-05, "loss": 1.5068, "step": 3177 }, { "epoch": 0.09, "learning_rate": 1.9831400001926818e-05, "loss": 1.4534, "step": 3178 }, { "epoch": 0.09, "learning_rate": 1.9831238227416178e-05, "loss": 1.5754, "step": 3179 }, { "epoch": 0.09, "learning_rate": 1.9831076375990558e-05, "loss": 1.554, "step": 3180 }, { "epoch": 0.09, "learning_rate": 1.9830914447651216e-05, "loss": 1.5547, "step": 3181 }, { "epoch": 0.09, "learning_rate": 1.9830752442399422e-05, "loss": 1.5359, "step": 3182 }, { "epoch": 0.09, "learning_rate": 1.9830590360236443e-05, "loss": 1.7788, "step": 3183 }, { "epoch": 0.09, "learning_rate": 1.983042820116355e-05, "loss": 1.6177, "step": 3184 }, { "epoch": 0.09, "learning_rate": 1.983026596518201e-05, "loss": 1.3547, "step": 3185 }, { "epoch": 0.09, "learning_rate": 1.983010365229309e-05, "loss": 1.5483, "step": 3186 }, { "epoch": 0.09, "learning_rate": 1.9829941262498062e-05, "loss": 1.5679, "step": 3187 }, { "epoch": 0.09, "learning_rate": 1.9829778795798192e-05, "loss": 1.4292, "step": 3188 }, { "epoch": 0.09, "learning_rate": 1.9829616252194757e-05, "loss": 1.4944, "step": 3189 }, { "epoch": 0.09, "learning_rate": 1.9829453631689032e-05, "loss": 1.5217, "step": 3190 }, { "epoch": 0.09, "learning_rate": 1.982929093428228e-05, "loss": 1.5767, "step": 3191 }, { "epoch": 0.09, "learning_rate": 1.982912815997578e-05, "loss": 1.5359, "step": 3192 }, { "epoch": 0.09, "learning_rate": 1.9828965308770798e-05, "loss": 1.6162, "step": 3193 }, { "epoch": 0.09, "learning_rate": 1.982880238066862e-05, "loss": 1.4033, "step": 3194 }, { "epoch": 0.09, "learning_rate": 1.9828639375670505e-05, "loss": 1.5771, "step": 3195 }, { "epoch": 0.09, "learning_rate": 1.9828476293777744e-05, "loss": 1.4644, "step": 3196 }, { "epoch": 0.09, "learning_rate": 1.9828313134991607e-05, "loss": 1.5933, "step": 3197 }, { "epoch": 0.09, "learning_rate": 1.9828149899313364e-05, "loss": 1.4849, "step": 3198 }, { "epoch": 0.09, "learning_rate": 1.9827986586744302e-05, "loss": 1.4583, "step": 3199 }, { "epoch": 0.09, "learning_rate": 1.9827823197285693e-05, "loss": 1.4512, "step": 3200 }, { "epoch": 0.09, "learning_rate": 1.9827659730938816e-05, "loss": 1.4897, "step": 3201 }, { "epoch": 0.09, "learning_rate": 1.9827496187704956e-05, "loss": 1.4546, "step": 3202 }, { "epoch": 0.09, "learning_rate": 1.9827332567585384e-05, "loss": 1.5261, "step": 3203 }, { "epoch": 0.09, "learning_rate": 1.9827168870581376e-05, "loss": 1.46, "step": 3204 }, { "epoch": 0.09, "learning_rate": 1.9827005096694227e-05, "loss": 1.5454, "step": 3205 }, { "epoch": 0.09, "learning_rate": 1.982684124592521e-05, "loss": 1.7593, "step": 3206 }, { "epoch": 0.09, "learning_rate": 1.982667731827561e-05, "loss": 1.3823, "step": 3207 }, { "epoch": 0.09, "learning_rate": 1.9826513313746702e-05, "loss": 1.5635, "step": 3208 }, { "epoch": 0.09, "learning_rate": 1.982634923233978e-05, "loss": 1.5032, "step": 3209 }, { "epoch": 0.09, "learning_rate": 1.982618507405612e-05, "loss": 1.3413, "step": 3210 }, { "epoch": 0.09, "learning_rate": 1.982602083889701e-05, "loss": 1.5859, "step": 3211 }, { "epoch": 0.09, "learning_rate": 1.982585652686373e-05, "loss": 1.4919, "step": 3212 }, { "epoch": 0.09, "learning_rate": 1.9825692137957574e-05, "loss": 1.509, "step": 3213 }, { "epoch": 0.09, "learning_rate": 1.982552767217982e-05, "loss": 1.4868, "step": 3214 }, { "epoch": 0.09, "learning_rate": 1.9825363129531755e-05, "loss": 1.4922, "step": 3215 }, { "epoch": 0.09, "learning_rate": 1.9825198510014674e-05, "loss": 1.4536, "step": 3216 }, { "epoch": 0.09, "learning_rate": 1.982503381362986e-05, "loss": 1.3604, "step": 3217 }, { "epoch": 0.09, "learning_rate": 1.98248690403786e-05, "loss": 1.4417, "step": 3218 }, { "epoch": 0.09, "learning_rate": 1.982470419026218e-05, "loss": 1.5693, "step": 3219 }, { "epoch": 0.09, "learning_rate": 1.9824539263281902e-05, "loss": 1.4285, "step": 3220 }, { "epoch": 0.09, "learning_rate": 1.9824374259439044e-05, "loss": 1.5068, "step": 3221 }, { "epoch": 0.09, "learning_rate": 1.9824209178734903e-05, "loss": 1.5391, "step": 3222 }, { "epoch": 0.09, "learning_rate": 1.982404402117077e-05, "loss": 1.5833, "step": 3223 }, { "epoch": 0.09, "learning_rate": 1.9823878786747933e-05, "loss": 1.4873, "step": 3224 }, { "epoch": 0.09, "learning_rate": 1.982371347546769e-05, "loss": 1.3921, "step": 3225 }, { "epoch": 0.09, "learning_rate": 1.9823548087331332e-05, "loss": 1.478, "step": 3226 }, { "epoch": 0.09, "learning_rate": 1.9823382622340156e-05, "loss": 1.4822, "step": 3227 }, { "epoch": 0.09, "learning_rate": 1.982321708049545e-05, "loss": 1.4165, "step": 3228 }, { "epoch": 0.09, "learning_rate": 1.9823051461798513e-05, "loss": 1.4521, "step": 3229 }, { "epoch": 0.09, "learning_rate": 1.9822885766250638e-05, "loss": 1.5137, "step": 3230 }, { "epoch": 0.09, "learning_rate": 1.9822719993853126e-05, "loss": 1.4194, "step": 3231 }, { "epoch": 0.09, "learning_rate": 1.9822554144607277e-05, "loss": 1.4133, "step": 3232 }, { "epoch": 0.09, "learning_rate": 1.9822388218514377e-05, "loss": 1.5781, "step": 3233 }, { "epoch": 0.09, "learning_rate": 1.982222221557573e-05, "loss": 1.5156, "step": 3234 }, { "epoch": 0.09, "learning_rate": 1.982205613579264e-05, "loss": 1.4658, "step": 3235 }, { "epoch": 0.09, "learning_rate": 1.98218899791664e-05, "loss": 1.4954, "step": 3236 }, { "epoch": 0.09, "learning_rate": 1.982172374569831e-05, "loss": 1.5042, "step": 3237 }, { "epoch": 0.09, "learning_rate": 1.9821557435389672e-05, "loss": 1.4438, "step": 3238 }, { "epoch": 0.09, "learning_rate": 1.9821391048241784e-05, "loss": 1.5527, "step": 3239 }, { "epoch": 0.09, "learning_rate": 1.9821224584255956e-05, "loss": 1.6133, "step": 3240 }, { "epoch": 0.09, "learning_rate": 1.9821058043433482e-05, "loss": 1.4839, "step": 3241 }, { "epoch": 0.09, "learning_rate": 1.982089142577567e-05, "loss": 1.7905, "step": 3242 }, { "epoch": 0.09, "learning_rate": 1.982072473128382e-05, "loss": 1.5391, "step": 3243 }, { "epoch": 0.09, "learning_rate": 1.9820557959959238e-05, "loss": 1.4927, "step": 3244 }, { "epoch": 0.09, "learning_rate": 1.982039111180323e-05, "loss": 1.4949, "step": 3245 }, { "epoch": 0.09, "learning_rate": 1.9820224186817097e-05, "loss": 1.3582, "step": 3246 }, { "epoch": 0.09, "learning_rate": 1.982005718500215e-05, "loss": 1.4492, "step": 3247 }, { "epoch": 0.09, "learning_rate": 1.9819890106359693e-05, "loss": 1.3804, "step": 3248 }, { "epoch": 0.09, "learning_rate": 1.9819722950891034e-05, "loss": 1.3318, "step": 3249 }, { "epoch": 0.09, "learning_rate": 1.981955571859748e-05, "loss": 1.4629, "step": 3250 }, { "epoch": 0.09, "learning_rate": 1.981938840948034e-05, "loss": 1.4485, "step": 3251 }, { "epoch": 0.09, "learning_rate": 1.9819221023540918e-05, "loss": 1.3882, "step": 3252 }, { "epoch": 0.09, "learning_rate": 1.9819053560780534e-05, "loss": 1.5659, "step": 3253 }, { "epoch": 0.09, "learning_rate": 1.981888602120049e-05, "loss": 1.5327, "step": 3254 }, { "epoch": 0.09, "learning_rate": 1.98187184048021e-05, "loss": 1.5122, "step": 3255 }, { "epoch": 0.09, "learning_rate": 1.981855071158667e-05, "loss": 1.4236, "step": 3256 }, { "epoch": 0.09, "learning_rate": 1.981838294155552e-05, "loss": 1.3359, "step": 3257 }, { "epoch": 0.09, "learning_rate": 1.981821509470996e-05, "loss": 1.4119, "step": 3258 }, { "epoch": 0.09, "learning_rate": 1.9818047171051298e-05, "loss": 1.5571, "step": 3259 }, { "epoch": 0.09, "learning_rate": 1.9817879170580853e-05, "loss": 1.4009, "step": 3260 }, { "epoch": 0.09, "learning_rate": 1.981771109329994e-05, "loss": 1.4546, "step": 3261 }, { "epoch": 0.09, "learning_rate": 1.9817542939209867e-05, "loss": 1.4114, "step": 3262 }, { "epoch": 0.09, "learning_rate": 1.981737470831196e-05, "loss": 1.4761, "step": 3263 }, { "epoch": 0.09, "learning_rate": 1.981720640060753e-05, "loss": 1.542, "step": 3264 }, { "epoch": 0.09, "learning_rate": 1.981703801609789e-05, "loss": 1.4185, "step": 3265 }, { "epoch": 0.09, "learning_rate": 1.9816869554784363e-05, "loss": 1.4907, "step": 3266 }, { "epoch": 0.09, "learning_rate": 1.9816701016668266e-05, "loss": 1.5762, "step": 3267 }, { "epoch": 0.09, "learning_rate": 1.981653240175091e-05, "loss": 1.4197, "step": 3268 }, { "epoch": 0.09, "learning_rate": 1.981636371003363e-05, "loss": 1.4231, "step": 3269 }, { "epoch": 0.09, "learning_rate": 1.9816194941517726e-05, "loss": 1.5039, "step": 3270 }, { "epoch": 0.09, "learning_rate": 1.9816026096204538e-05, "loss": 1.5374, "step": 3271 }, { "epoch": 0.09, "learning_rate": 1.981585717409537e-05, "loss": 1.4839, "step": 3272 }, { "epoch": 0.09, "learning_rate": 1.9815688175191558e-05, "loss": 1.4045, "step": 3273 }, { "epoch": 0.09, "learning_rate": 1.9815519099494413e-05, "loss": 1.429, "step": 3274 }, { "epoch": 0.09, "learning_rate": 1.9815349947005265e-05, "loss": 1.387, "step": 3275 }, { "epoch": 0.09, "learning_rate": 1.981518071772543e-05, "loss": 1.4624, "step": 3276 }, { "epoch": 0.09, "learning_rate": 1.9815011411656243e-05, "loss": 1.5117, "step": 3277 }, { "epoch": 0.09, "learning_rate": 1.981484202879902e-05, "loss": 1.4407, "step": 3278 }, { "epoch": 0.09, "learning_rate": 1.9814672569155083e-05, "loss": 1.4194, "step": 3279 }, { "epoch": 0.09, "learning_rate": 1.9814503032725768e-05, "loss": 1.4443, "step": 3280 }, { "epoch": 0.09, "learning_rate": 1.9814333419512394e-05, "loss": 1.4219, "step": 3281 }, { "epoch": 0.09, "learning_rate": 1.981416372951629e-05, "loss": 1.478, "step": 3282 }, { "epoch": 0.09, "learning_rate": 1.9813993962738787e-05, "loss": 1.5278, "step": 3283 }, { "epoch": 0.09, "learning_rate": 1.9813824119181207e-05, "loss": 1.8262, "step": 3284 }, { "epoch": 0.09, "learning_rate": 1.9813654198844885e-05, "loss": 1.2976, "step": 3285 }, { "epoch": 0.09, "learning_rate": 1.9813484201731144e-05, "loss": 1.5581, "step": 3286 }, { "epoch": 0.09, "learning_rate": 1.981331412784132e-05, "loss": 1.5649, "step": 3287 }, { "epoch": 0.09, "learning_rate": 1.981314397717674e-05, "loss": 1.5498, "step": 3288 }, { "epoch": 0.09, "learning_rate": 1.9812973749738736e-05, "loss": 1.3774, "step": 3289 }, { "epoch": 0.09, "learning_rate": 1.981280344552864e-05, "loss": 1.4014, "step": 3290 }, { "epoch": 0.09, "learning_rate": 1.9812633064547784e-05, "loss": 1.5024, "step": 3291 }, { "epoch": 0.09, "learning_rate": 1.98124626067975e-05, "loss": 1.3362, "step": 3292 }, { "epoch": 0.09, "learning_rate": 1.9812292072279122e-05, "loss": 1.4839, "step": 3293 }, { "epoch": 0.09, "learning_rate": 1.9812121460993985e-05, "loss": 1.3977, "step": 3294 }, { "epoch": 0.09, "learning_rate": 1.9811950772943425e-05, "loss": 1.3359, "step": 3295 }, { "epoch": 0.09, "learning_rate": 1.981178000812878e-05, "loss": 1.4109, "step": 3296 }, { "epoch": 0.09, "learning_rate": 1.9811609166551377e-05, "loss": 1.3684, "step": 3297 }, { "epoch": 0.09, "learning_rate": 1.9811438248212558e-05, "loss": 1.4438, "step": 3298 }, { "epoch": 0.09, "learning_rate": 1.981126725311366e-05, "loss": 1.4189, "step": 3299 }, { "epoch": 0.09, "learning_rate": 1.981109618125602e-05, "loss": 1.4639, "step": 3300 }, { "epoch": 0.09, "learning_rate": 1.981092503264098e-05, "loss": 1.4365, "step": 3301 }, { "epoch": 0.09, "learning_rate": 1.9810753807269875e-05, "loss": 1.519, "step": 3302 }, { "epoch": 0.09, "learning_rate": 1.9810582505144043e-05, "loss": 1.4895, "step": 3303 }, { "epoch": 0.09, "learning_rate": 1.981041112626483e-05, "loss": 1.5298, "step": 3304 }, { "epoch": 0.09, "learning_rate": 1.981023967063357e-05, "loss": 1.4075, "step": 3305 }, { "epoch": 0.09, "learning_rate": 1.981006813825161e-05, "loss": 1.5181, "step": 3306 }, { "epoch": 0.09, "learning_rate": 1.980989652912029e-05, "loss": 1.6309, "step": 3307 }, { "epoch": 0.09, "learning_rate": 1.980972484324095e-05, "loss": 1.6382, "step": 3308 }, { "epoch": 0.09, "learning_rate": 1.980955308061494e-05, "loss": 1.4077, "step": 3309 }, { "epoch": 0.09, "learning_rate": 1.9809381241243598e-05, "loss": 1.4443, "step": 3310 }, { "epoch": 0.09, "learning_rate": 1.980920932512827e-05, "loss": 1.3833, "step": 3311 }, { "epoch": 0.09, "learning_rate": 1.9809037332270297e-05, "loss": 1.7798, "step": 3312 }, { "epoch": 0.09, "learning_rate": 1.9808865262671033e-05, "loss": 1.3604, "step": 3313 }, { "epoch": 0.09, "learning_rate": 1.980869311633182e-05, "loss": 1.5474, "step": 3314 }, { "epoch": 0.09, "learning_rate": 1.9808520893254e-05, "loss": 1.5056, "step": 3315 }, { "epoch": 0.09, "learning_rate": 1.980834859343893e-05, "loss": 1.4355, "step": 3316 }, { "epoch": 0.09, "learning_rate": 1.980817621688795e-05, "loss": 1.4641, "step": 3317 }, { "epoch": 0.09, "learning_rate": 1.9808003763602407e-05, "loss": 1.4736, "step": 3318 }, { "epoch": 0.09, "learning_rate": 1.9807831233583662e-05, "loss": 1.4512, "step": 3319 }, { "epoch": 0.09, "learning_rate": 1.9807658626833053e-05, "loss": 1.3552, "step": 3320 }, { "epoch": 0.09, "learning_rate": 1.980748594335194e-05, "loss": 1.2402, "step": 3321 }, { "epoch": 0.09, "learning_rate": 1.9807313183141664e-05, "loss": 1.3096, "step": 3322 }, { "epoch": 0.09, "learning_rate": 1.980714034620358e-05, "loss": 1.4578, "step": 3323 }, { "epoch": 0.09, "learning_rate": 1.9806967432539043e-05, "loss": 1.248, "step": 3324 }, { "epoch": 0.09, "learning_rate": 1.9806794442149408e-05, "loss": 1.4973, "step": 3325 }, { "epoch": 0.09, "learning_rate": 1.9806621375036023e-05, "loss": 1.6431, "step": 3326 }, { "epoch": 0.09, "learning_rate": 1.980644823120024e-05, "loss": 1.5056, "step": 3327 }, { "epoch": 0.09, "learning_rate": 1.980627501064342e-05, "loss": 1.5066, "step": 3328 }, { "epoch": 0.09, "learning_rate": 1.9806101713366916e-05, "loss": 1.3699, "step": 3329 }, { "epoch": 0.09, "learning_rate": 1.9805928339372085e-05, "loss": 1.4463, "step": 3330 }, { "epoch": 0.09, "learning_rate": 1.980575488866028e-05, "loss": 1.3645, "step": 3331 }, { "epoch": 0.09, "learning_rate": 1.980558136123286e-05, "loss": 1.4731, "step": 3332 }, { "epoch": 0.09, "learning_rate": 1.980540775709118e-05, "loss": 1.5173, "step": 3333 }, { "epoch": 0.09, "learning_rate": 1.9805234076236605e-05, "loss": 1.7021, "step": 3334 }, { "epoch": 0.09, "learning_rate": 1.980506031867049e-05, "loss": 1.5581, "step": 3335 }, { "epoch": 0.09, "learning_rate": 1.9804886484394184e-05, "loss": 1.54, "step": 3336 }, { "epoch": 0.09, "learning_rate": 1.9804712573409067e-05, "loss": 1.5352, "step": 3337 }, { "epoch": 0.09, "learning_rate": 1.9804538585716484e-05, "loss": 1.4463, "step": 3338 }, { "epoch": 0.09, "learning_rate": 1.9804364521317806e-05, "loss": 1.4976, "step": 3339 }, { "epoch": 0.09, "learning_rate": 1.9804190380214386e-05, "loss": 1.6084, "step": 3340 }, { "epoch": 0.09, "learning_rate": 1.9804016162407593e-05, "loss": 1.4688, "step": 3341 }, { "epoch": 0.09, "learning_rate": 1.9803841867898788e-05, "loss": 1.2866, "step": 3342 }, { "epoch": 0.09, "learning_rate": 1.980366749668933e-05, "loss": 1.5469, "step": 3343 }, { "epoch": 0.09, "learning_rate": 1.9803493048780592e-05, "loss": 1.6184, "step": 3344 }, { "epoch": 0.09, "learning_rate": 1.9803318524173932e-05, "loss": 1.4697, "step": 3345 }, { "epoch": 0.09, "learning_rate": 1.9803143922870722e-05, "loss": 1.3635, "step": 3346 }, { "epoch": 0.09, "learning_rate": 1.9802969244872318e-05, "loss": 1.4819, "step": 3347 }, { "epoch": 0.09, "learning_rate": 1.9802794490180094e-05, "loss": 1.4668, "step": 3348 }, { "epoch": 0.09, "learning_rate": 1.980261965879542e-05, "loss": 1.4834, "step": 3349 }, { "epoch": 0.09, "learning_rate": 1.9802444750719652e-05, "loss": 1.4922, "step": 3350 }, { "epoch": 0.09, "learning_rate": 1.980226976595417e-05, "loss": 1.4678, "step": 3351 }, { "epoch": 0.09, "learning_rate": 1.980209470450034e-05, "loss": 1.4209, "step": 3352 }, { "epoch": 0.09, "learning_rate": 1.980191956635953e-05, "loss": 1.4404, "step": 3353 }, { "epoch": 0.09, "learning_rate": 1.9801744351533107e-05, "loss": 1.4072, "step": 3354 }, { "epoch": 0.09, "learning_rate": 1.9801569060022448e-05, "loss": 1.4929, "step": 3355 }, { "epoch": 0.09, "learning_rate": 1.980139369182892e-05, "loss": 1.5789, "step": 3356 }, { "epoch": 0.09, "learning_rate": 1.9801218246953898e-05, "loss": 1.3032, "step": 3357 }, { "epoch": 0.09, "learning_rate": 1.9801042725398752e-05, "loss": 1.4048, "step": 3358 }, { "epoch": 0.09, "learning_rate": 1.980086712716486e-05, "loss": 1.4866, "step": 3359 }, { "epoch": 0.09, "learning_rate": 1.9800691452253588e-05, "loss": 1.3523, "step": 3360 }, { "epoch": 0.09, "learning_rate": 1.9800515700666317e-05, "loss": 1.4419, "step": 3361 }, { "epoch": 0.09, "learning_rate": 1.9800339872404417e-05, "loss": 1.5562, "step": 3362 }, { "epoch": 0.09, "learning_rate": 1.980016396746927e-05, "loss": 1.6973, "step": 3363 }, { "epoch": 0.09, "learning_rate": 1.9799987985862245e-05, "loss": 1.5684, "step": 3364 }, { "epoch": 0.09, "learning_rate": 1.9799811927584723e-05, "loss": 1.627, "step": 3365 }, { "epoch": 0.09, "learning_rate": 1.9799635792638082e-05, "loss": 1.4141, "step": 3366 }, { "epoch": 0.09, "learning_rate": 1.97994595810237e-05, "loss": 1.3525, "step": 3367 }, { "epoch": 0.09, "learning_rate": 1.979928329274295e-05, "loss": 1.4224, "step": 3368 }, { "epoch": 0.09, "learning_rate": 1.979910692779722e-05, "loss": 1.4995, "step": 3369 }, { "epoch": 0.09, "learning_rate": 1.9798930486187886e-05, "loss": 1.3696, "step": 3370 }, { "epoch": 0.09, "learning_rate": 1.9798753967916325e-05, "loss": 1.4883, "step": 3371 }, { "epoch": 0.09, "learning_rate": 1.979857737298392e-05, "loss": 1.3821, "step": 3372 }, { "epoch": 0.09, "learning_rate": 1.9798400701392053e-05, "loss": 1.3723, "step": 3373 }, { "epoch": 0.09, "learning_rate": 1.979822395314211e-05, "loss": 1.5105, "step": 3374 }, { "epoch": 0.09, "learning_rate": 1.9798047128235463e-05, "loss": 1.3809, "step": 3375 }, { "epoch": 0.09, "learning_rate": 1.9797870226673508e-05, "loss": 1.4138, "step": 3376 }, { "epoch": 0.09, "learning_rate": 1.9797693248457626e-05, "loss": 1.3877, "step": 3377 }, { "epoch": 0.09, "learning_rate": 1.9797516193589196e-05, "loss": 1.458, "step": 3378 }, { "epoch": 0.09, "learning_rate": 1.9797339062069606e-05, "loss": 1.5449, "step": 3379 }, { "epoch": 0.09, "learning_rate": 1.979716185390024e-05, "loss": 1.4619, "step": 3380 }, { "epoch": 0.09, "learning_rate": 1.979698456908249e-05, "loss": 1.3545, "step": 3381 }, { "epoch": 0.09, "learning_rate": 1.9796807207617742e-05, "loss": 1.4556, "step": 3382 }, { "epoch": 0.09, "learning_rate": 1.9796629769507375e-05, "loss": 1.573, "step": 3383 }, { "epoch": 0.09, "learning_rate": 1.9796452254752787e-05, "loss": 1.5095, "step": 3384 }, { "epoch": 0.09, "learning_rate": 1.9796274663355365e-05, "loss": 1.8872, "step": 3385 }, { "epoch": 0.09, "learning_rate": 1.979609699531649e-05, "loss": 1.5396, "step": 3386 }, { "epoch": 0.09, "learning_rate": 1.9795919250637564e-05, "loss": 1.521, "step": 3387 }, { "epoch": 0.09, "learning_rate": 1.9795741429319974e-05, "loss": 1.4702, "step": 3388 }, { "epoch": 0.09, "learning_rate": 1.9795563531365106e-05, "loss": 1.4922, "step": 3389 }, { "epoch": 0.09, "learning_rate": 1.9795385556774356e-05, "loss": 1.4238, "step": 3390 }, { "epoch": 0.09, "learning_rate": 1.9795207505549113e-05, "loss": 1.2969, "step": 3391 }, { "epoch": 0.09, "learning_rate": 1.9795029377690777e-05, "loss": 1.4236, "step": 3392 }, { "epoch": 0.09, "learning_rate": 1.9794851173200733e-05, "loss": 1.4319, "step": 3393 }, { "epoch": 0.09, "learning_rate": 1.979467289208038e-05, "loss": 1.3203, "step": 3394 }, { "epoch": 0.09, "learning_rate": 1.9794494534331116e-05, "loss": 1.7554, "step": 3395 }, { "epoch": 0.09, "learning_rate": 1.9794316099954324e-05, "loss": 1.5198, "step": 3396 }, { "epoch": 0.09, "learning_rate": 1.9794137588951416e-05, "loss": 1.5955, "step": 3397 }, { "epoch": 0.09, "learning_rate": 1.979395900132378e-05, "loss": 1.5754, "step": 3398 }, { "epoch": 0.09, "learning_rate": 1.9793780337072813e-05, "loss": 1.5518, "step": 3399 }, { "epoch": 0.09, "learning_rate": 1.9793601596199914e-05, "loss": 1.4893, "step": 3400 }, { "epoch": 0.09, "learning_rate": 1.979342277870648e-05, "loss": 1.4966, "step": 3401 }, { "epoch": 0.09, "learning_rate": 1.9793243884593915e-05, "loss": 1.8047, "step": 3402 }, { "epoch": 0.09, "learning_rate": 1.979306491386361e-05, "loss": 1.3801, "step": 3403 }, { "epoch": 0.09, "learning_rate": 1.9792885866516976e-05, "loss": 1.5767, "step": 3404 }, { "epoch": 0.09, "learning_rate": 1.97927067425554e-05, "loss": 1.3706, "step": 3405 }, { "epoch": 0.09, "learning_rate": 1.97925275419803e-05, "loss": 1.3967, "step": 3406 }, { "epoch": 0.09, "learning_rate": 1.9792348264793065e-05, "loss": 1.5386, "step": 3407 }, { "epoch": 0.09, "learning_rate": 1.97921689109951e-05, "loss": 1.3445, "step": 3408 }, { "epoch": 0.09, "learning_rate": 1.9791989480587815e-05, "loss": 1.4226, "step": 3409 }, { "epoch": 0.09, "learning_rate": 1.9791809973572606e-05, "loss": 1.4878, "step": 3410 }, { "epoch": 0.09, "learning_rate": 1.979163038995088e-05, "loss": 1.3794, "step": 3411 }, { "epoch": 0.09, "learning_rate": 1.9791450729724043e-05, "loss": 1.939, "step": 3412 }, { "epoch": 0.09, "learning_rate": 1.9791270992893497e-05, "loss": 1.4973, "step": 3413 }, { "epoch": 0.09, "learning_rate": 1.9791091179460657e-05, "loss": 1.4878, "step": 3414 }, { "epoch": 0.09, "learning_rate": 1.9790911289426917e-05, "loss": 1.4338, "step": 3415 }, { "epoch": 0.09, "learning_rate": 1.9790731322793694e-05, "loss": 1.4343, "step": 3416 }, { "epoch": 0.09, "learning_rate": 1.9790551279562393e-05, "loss": 1.4031, "step": 3417 }, { "epoch": 0.09, "learning_rate": 1.9790371159734425e-05, "loss": 1.3433, "step": 3418 }, { "epoch": 0.09, "learning_rate": 1.9790190963311192e-05, "loss": 1.2021, "step": 3419 }, { "epoch": 0.09, "learning_rate": 1.979001069029411e-05, "loss": 1.5977, "step": 3420 }, { "epoch": 0.09, "learning_rate": 1.9789830340684593e-05, "loss": 1.7803, "step": 3421 }, { "epoch": 0.09, "learning_rate": 1.9789649914484043e-05, "loss": 1.4138, "step": 3422 }, { "epoch": 0.09, "learning_rate": 1.9789469411693875e-05, "loss": 1.4927, "step": 3423 }, { "epoch": 0.09, "learning_rate": 1.97892888323155e-05, "loss": 1.4331, "step": 3424 }, { "epoch": 0.09, "learning_rate": 1.9789108176350337e-05, "loss": 1.2925, "step": 3425 }, { "epoch": 0.09, "learning_rate": 1.978892744379979e-05, "loss": 1.4609, "step": 3426 }, { "epoch": 0.09, "learning_rate": 1.978874663466528e-05, "loss": 1.323, "step": 3427 }, { "epoch": 0.09, "learning_rate": 1.9788565748948222e-05, "loss": 1.5205, "step": 3428 }, { "epoch": 0.09, "learning_rate": 1.9788384786650023e-05, "loss": 1.4751, "step": 3429 }, { "epoch": 0.09, "learning_rate": 1.9788203747772107e-05, "loss": 1.5791, "step": 3430 }, { "epoch": 0.09, "learning_rate": 1.978802263231589e-05, "loss": 1.6514, "step": 3431 }, { "epoch": 0.09, "learning_rate": 1.9787841440282782e-05, "loss": 1.4446, "step": 3432 }, { "epoch": 0.09, "learning_rate": 1.978766017167421e-05, "loss": 1.5977, "step": 3433 }, { "epoch": 0.09, "learning_rate": 1.978747882649158e-05, "loss": 1.437, "step": 3434 }, { "epoch": 0.09, "learning_rate": 1.9787297404736325e-05, "loss": 1.4373, "step": 3435 }, { "epoch": 0.09, "learning_rate": 1.978711590640986e-05, "loss": 1.4746, "step": 3436 }, { "epoch": 0.09, "learning_rate": 1.9786934331513593e-05, "loss": 1.4956, "step": 3437 }, { "epoch": 0.09, "learning_rate": 1.9786752680048957e-05, "loss": 1.4617, "step": 3438 }, { "epoch": 0.09, "learning_rate": 1.9786570952017374e-05, "loss": 1.5918, "step": 3439 }, { "epoch": 0.09, "learning_rate": 1.978638914742026e-05, "loss": 1.3916, "step": 3440 }, { "epoch": 0.09, "learning_rate": 1.978620726625904e-05, "loss": 1.4373, "step": 3441 }, { "epoch": 0.09, "learning_rate": 1.9786025308535134e-05, "loss": 1.4819, "step": 3442 }, { "epoch": 0.09, "learning_rate": 1.9785843274249967e-05, "loss": 1.5264, "step": 3443 }, { "epoch": 0.09, "learning_rate": 1.9785661163404964e-05, "loss": 1.468, "step": 3444 }, { "epoch": 0.09, "learning_rate": 1.9785478976001552e-05, "loss": 1.7695, "step": 3445 }, { "epoch": 0.09, "learning_rate": 1.9785296712041155e-05, "loss": 1.5581, "step": 3446 }, { "epoch": 0.09, "learning_rate": 1.9785114371525195e-05, "loss": 1.3477, "step": 3447 }, { "epoch": 0.09, "learning_rate": 1.97849319544551e-05, "loss": 1.4548, "step": 3448 }, { "epoch": 0.09, "learning_rate": 1.97847494608323e-05, "loss": 1.5786, "step": 3449 }, { "epoch": 0.09, "learning_rate": 1.9784566890658224e-05, "loss": 1.3757, "step": 3450 }, { "epoch": 0.09, "learning_rate": 1.9784384243934297e-05, "loss": 1.2336, "step": 3451 }, { "epoch": 0.09, "learning_rate": 1.9784201520661946e-05, "loss": 1.3943, "step": 3452 }, { "epoch": 0.09, "learning_rate": 1.9784018720842604e-05, "loss": 1.3406, "step": 3453 }, { "epoch": 0.09, "learning_rate": 1.97838358444777e-05, "loss": 1.4094, "step": 3454 }, { "epoch": 0.09, "learning_rate": 1.9783652891568666e-05, "loss": 1.4619, "step": 3455 }, { "epoch": 0.09, "learning_rate": 1.9783469862116937e-05, "loss": 1.3088, "step": 3456 }, { "epoch": 0.09, "learning_rate": 1.9783286756123933e-05, "loss": 1.3542, "step": 3457 }, { "epoch": 0.09, "learning_rate": 1.9783103573591097e-05, "loss": 1.4377, "step": 3458 }, { "epoch": 0.09, "learning_rate": 1.978292031451986e-05, "loss": 1.6416, "step": 3459 }, { "epoch": 0.09, "learning_rate": 1.978273697891165e-05, "loss": 1.4255, "step": 3460 }, { "epoch": 0.09, "learning_rate": 1.978255356676791e-05, "loss": 1.502, "step": 3461 }, { "epoch": 0.09, "learning_rate": 1.9782370078090068e-05, "loss": 1.447, "step": 3462 }, { "epoch": 0.09, "learning_rate": 1.9782186512879568e-05, "loss": 1.5586, "step": 3463 }, { "epoch": 0.09, "learning_rate": 1.9782002871137835e-05, "loss": 1.4697, "step": 3464 }, { "epoch": 0.09, "learning_rate": 1.9781819152866312e-05, "loss": 1.5127, "step": 3465 }, { "epoch": 0.09, "learning_rate": 1.978163535806644e-05, "loss": 1.3857, "step": 3466 }, { "epoch": 0.09, "learning_rate": 1.978145148673965e-05, "loss": 1.5623, "step": 3467 }, { "epoch": 0.09, "learning_rate": 1.9781267538887382e-05, "loss": 1.5039, "step": 3468 }, { "epoch": 0.09, "learning_rate": 1.9781083514511078e-05, "loss": 1.4937, "step": 3469 }, { "epoch": 0.09, "learning_rate": 1.9780899413612175e-05, "loss": 1.584, "step": 3470 }, { "epoch": 0.09, "learning_rate": 1.9780715236192115e-05, "loss": 1.4951, "step": 3471 }, { "epoch": 0.09, "learning_rate": 1.978053098225234e-05, "loss": 1.394, "step": 3472 }, { "epoch": 0.09, "learning_rate": 1.9780346651794286e-05, "loss": 1.4453, "step": 3473 }, { "epoch": 0.09, "learning_rate": 1.97801622448194e-05, "loss": 1.3738, "step": 3474 }, { "epoch": 0.09, "learning_rate": 1.9779977761329124e-05, "loss": 1.3923, "step": 3475 }, { "epoch": 0.09, "learning_rate": 1.97797932013249e-05, "loss": 1.4573, "step": 3476 }, { "epoch": 0.09, "learning_rate": 1.9779608564808174e-05, "loss": 1.3809, "step": 3477 }, { "epoch": 0.09, "learning_rate": 1.977942385178039e-05, "loss": 1.2755, "step": 3478 }, { "epoch": 0.1, "learning_rate": 1.9779239062242988e-05, "loss": 1.6309, "step": 3479 }, { "epoch": 0.1, "learning_rate": 1.977905419619742e-05, "loss": 1.543, "step": 3480 }, { "epoch": 0.1, "learning_rate": 1.9778869253645134e-05, "loss": 1.4939, "step": 3481 }, { "epoch": 0.1, "learning_rate": 1.977868423458757e-05, "loss": 1.4536, "step": 3482 }, { "epoch": 0.1, "learning_rate": 1.9778499139026182e-05, "loss": 1.3767, "step": 3483 }, { "epoch": 0.1, "learning_rate": 1.977831396696241e-05, "loss": 1.4656, "step": 3484 }, { "epoch": 0.1, "learning_rate": 1.9778128718397712e-05, "loss": 1.3848, "step": 3485 }, { "epoch": 0.1, "learning_rate": 1.977794339333353e-05, "loss": 1.5239, "step": 3486 }, { "epoch": 0.1, "learning_rate": 1.977775799177132e-05, "loss": 1.5371, "step": 3487 }, { "epoch": 0.1, "learning_rate": 1.9777572513712525e-05, "loss": 1.4402, "step": 3488 }, { "epoch": 0.1, "learning_rate": 1.9777386959158605e-05, "loss": 1.561, "step": 3489 }, { "epoch": 0.1, "learning_rate": 1.9777201328111003e-05, "loss": 1.6138, "step": 3490 }, { "epoch": 0.1, "learning_rate": 1.977701562057118e-05, "loss": 1.5623, "step": 3491 }, { "epoch": 0.1, "learning_rate": 1.977682983654058e-05, "loss": 1.6731, "step": 3492 }, { "epoch": 0.1, "learning_rate": 1.9776643976020663e-05, "loss": 1.2905, "step": 3493 }, { "epoch": 0.1, "learning_rate": 1.977645803901288e-05, "loss": 1.4263, "step": 3494 }, { "epoch": 0.1, "learning_rate": 1.9776272025518686e-05, "loss": 1.3469, "step": 3495 }, { "epoch": 0.1, "learning_rate": 1.9776085935539536e-05, "loss": 1.4124, "step": 3496 }, { "epoch": 0.1, "learning_rate": 1.977589976907689e-05, "loss": 1.5977, "step": 3497 }, { "epoch": 0.1, "learning_rate": 1.9775713526132198e-05, "loss": 1.5786, "step": 3498 }, { "epoch": 0.1, "learning_rate": 1.9775527206706923e-05, "loss": 1.8467, "step": 3499 }, { "epoch": 0.1, "learning_rate": 1.9775340810802515e-05, "loss": 1.4668, "step": 3500 }, { "epoch": 0.1, "learning_rate": 1.977515433842044e-05, "loss": 1.6494, "step": 3501 }, { "epoch": 0.1, "learning_rate": 1.9774967789562157e-05, "loss": 1.4834, "step": 3502 }, { "epoch": 0.1, "learning_rate": 1.977478116422912e-05, "loss": 1.4241, "step": 3503 }, { "epoch": 0.1, "learning_rate": 1.9774594462422793e-05, "loss": 1.8228, "step": 3504 }, { "epoch": 0.1, "learning_rate": 1.9774407684144633e-05, "loss": 1.3999, "step": 3505 }, { "epoch": 0.1, "learning_rate": 1.9774220829396104e-05, "loss": 1.3887, "step": 3506 }, { "epoch": 0.1, "learning_rate": 1.9774033898178668e-05, "loss": 1.5176, "step": 3507 }, { "epoch": 0.1, "learning_rate": 1.9773846890493787e-05, "loss": 1.3198, "step": 3508 }, { "epoch": 0.1, "learning_rate": 1.9773659806342926e-05, "loss": 1.3289, "step": 3509 }, { "epoch": 0.1, "learning_rate": 1.977347264572754e-05, "loss": 1.4976, "step": 3510 }, { "epoch": 0.1, "learning_rate": 1.9773285408649106e-05, "loss": 1.4741, "step": 3511 }, { "epoch": 0.1, "learning_rate": 1.977309809510908e-05, "loss": 1.4766, "step": 3512 }, { "epoch": 0.1, "learning_rate": 1.977291070510893e-05, "loss": 1.4585, "step": 3513 }, { "epoch": 0.1, "learning_rate": 1.9772723238650124e-05, "loss": 1.5415, "step": 3514 }, { "epoch": 0.1, "learning_rate": 1.9772535695734126e-05, "loss": 1.4419, "step": 3515 }, { "epoch": 0.1, "learning_rate": 1.9772348076362404e-05, "loss": 1.4263, "step": 3516 }, { "epoch": 0.1, "learning_rate": 1.9772160380536423e-05, "loss": 1.4888, "step": 3517 }, { "epoch": 0.1, "learning_rate": 1.977197260825766e-05, "loss": 1.3845, "step": 3518 }, { "epoch": 0.1, "learning_rate": 1.977178475952758e-05, "loss": 1.5664, "step": 3519 }, { "epoch": 0.1, "learning_rate": 1.9771596834347644e-05, "loss": 1.5059, "step": 3520 }, { "epoch": 0.1, "learning_rate": 1.977140883271933e-05, "loss": 1.3855, "step": 3521 }, { "epoch": 0.1, "learning_rate": 1.9771220754644112e-05, "loss": 1.481, "step": 3522 }, { "epoch": 0.1, "learning_rate": 1.9771032600123455e-05, "loss": 1.5325, "step": 3523 }, { "epoch": 0.1, "learning_rate": 1.9770844369158833e-05, "loss": 1.583, "step": 3524 }, { "epoch": 0.1, "learning_rate": 1.977065606175172e-05, "loss": 1.4985, "step": 3525 }, { "epoch": 0.1, "learning_rate": 1.977046767790359e-05, "loss": 1.3911, "step": 3526 }, { "epoch": 0.1, "learning_rate": 1.9770279217615915e-05, "loss": 1.4103, "step": 3527 }, { "epoch": 0.1, "learning_rate": 1.977009068089017e-05, "loss": 1.5457, "step": 3528 }, { "epoch": 0.1, "learning_rate": 1.976990206772783e-05, "loss": 1.4333, "step": 3529 }, { "epoch": 0.1, "learning_rate": 1.9769713378130365e-05, "loss": 1.4631, "step": 3530 }, { "epoch": 0.1, "learning_rate": 1.9769524612099262e-05, "loss": 1.5974, "step": 3531 }, { "epoch": 0.1, "learning_rate": 1.9769335769635992e-05, "loss": 1.4314, "step": 3532 }, { "epoch": 0.1, "learning_rate": 1.9769146850742033e-05, "loss": 1.4189, "step": 3533 }, { "epoch": 0.1, "learning_rate": 1.9768957855418864e-05, "loss": 1.5483, "step": 3534 }, { "epoch": 0.1, "learning_rate": 1.9768768783667956e-05, "loss": 1.4858, "step": 3535 }, { "epoch": 0.1, "learning_rate": 1.97685796354908e-05, "loss": 1.5186, "step": 3536 }, { "epoch": 0.1, "learning_rate": 1.976839041088887e-05, "loss": 1.5444, "step": 3537 }, { "epoch": 0.1, "learning_rate": 1.9768201109863644e-05, "loss": 1.3806, "step": 3538 }, { "epoch": 0.1, "learning_rate": 1.9768011732416607e-05, "loss": 1.188, "step": 3539 }, { "epoch": 0.1, "learning_rate": 1.9767822278549242e-05, "loss": 1.5586, "step": 3540 }, { "epoch": 0.1, "learning_rate": 1.976763274826303e-05, "loss": 1.4456, "step": 3541 }, { "epoch": 0.1, "learning_rate": 1.9767443141559447e-05, "loss": 1.5203, "step": 3542 }, { "epoch": 0.1, "learning_rate": 1.9767253458439982e-05, "loss": 1.4912, "step": 3543 }, { "epoch": 0.1, "learning_rate": 1.976706369890612e-05, "loss": 1.5161, "step": 3544 }, { "epoch": 0.1, "learning_rate": 1.9766873862959347e-05, "loss": 1.3379, "step": 3545 }, { "epoch": 0.1, "learning_rate": 1.9766683950601148e-05, "loss": 1.5237, "step": 3546 }, { "epoch": 0.1, "learning_rate": 1.9766493961833e-05, "loss": 1.4766, "step": 3547 }, { "epoch": 0.1, "learning_rate": 1.97663038966564e-05, "loss": 1.3652, "step": 3548 }, { "epoch": 0.1, "learning_rate": 1.976611375507283e-05, "loss": 1.3262, "step": 3549 }, { "epoch": 0.1, "learning_rate": 1.9765923537083774e-05, "loss": 1.3101, "step": 3550 }, { "epoch": 0.1, "learning_rate": 1.9765733242690728e-05, "loss": 1.4478, "step": 3551 }, { "epoch": 0.1, "learning_rate": 1.9765542871895178e-05, "loss": 1.5225, "step": 3552 }, { "epoch": 0.1, "learning_rate": 1.976535242469861e-05, "loss": 1.582, "step": 3553 }, { "epoch": 0.1, "learning_rate": 1.9765161901102518e-05, "loss": 1.4231, "step": 3554 }, { "epoch": 0.1, "learning_rate": 1.9764971301108394e-05, "loss": 1.5688, "step": 3555 }, { "epoch": 0.1, "learning_rate": 1.976478062471772e-05, "loss": 1.4448, "step": 3556 }, { "epoch": 0.1, "learning_rate": 1.9764589871932003e-05, "loss": 1.564, "step": 3557 }, { "epoch": 0.1, "learning_rate": 1.976439904275272e-05, "loss": 1.5, "step": 3558 }, { "epoch": 0.1, "learning_rate": 1.976420813718137e-05, "loss": 1.5703, "step": 3559 }, { "epoch": 0.1, "learning_rate": 1.976401715521945e-05, "loss": 1.5342, "step": 3560 }, { "epoch": 0.1, "learning_rate": 1.9763826096868453e-05, "loss": 1.5005, "step": 3561 }, { "epoch": 0.1, "learning_rate": 1.9763634962129866e-05, "loss": 1.4758, "step": 3562 }, { "epoch": 0.1, "learning_rate": 1.9763443751005194e-05, "loss": 1.6099, "step": 3563 }, { "epoch": 0.1, "learning_rate": 1.976325246349593e-05, "loss": 1.4504, "step": 3564 }, { "epoch": 0.1, "learning_rate": 1.9763061099603567e-05, "loss": 1.3657, "step": 3565 }, { "epoch": 0.1, "learning_rate": 1.9762869659329605e-05, "loss": 1.5649, "step": 3566 }, { "epoch": 0.1, "learning_rate": 1.9762678142675544e-05, "loss": 1.4795, "step": 3567 }, { "epoch": 0.1, "learning_rate": 1.976248654964288e-05, "loss": 1.4917, "step": 3568 }, { "epoch": 0.1, "learning_rate": 1.9762294880233107e-05, "loss": 1.4868, "step": 3569 }, { "epoch": 0.1, "learning_rate": 1.9762103134447734e-05, "loss": 1.2644, "step": 3570 }, { "epoch": 0.1, "learning_rate": 1.9761911312288255e-05, "loss": 1.5415, "step": 3571 }, { "epoch": 0.1, "learning_rate": 1.9761719413756177e-05, "loss": 1.4316, "step": 3572 }, { "epoch": 0.1, "learning_rate": 1.976152743885299e-05, "loss": 1.5181, "step": 3573 }, { "epoch": 0.1, "learning_rate": 1.9761335387580205e-05, "loss": 1.3914, "step": 3574 }, { "epoch": 0.1, "learning_rate": 1.9761143259939318e-05, "loss": 1.5327, "step": 3575 }, { "epoch": 0.1, "learning_rate": 1.9760951055931844e-05, "loss": 1.5479, "step": 3576 }, { "epoch": 0.1, "learning_rate": 1.9760758775559275e-05, "loss": 1.6455, "step": 3577 }, { "epoch": 0.1, "learning_rate": 1.9760566418823117e-05, "loss": 1.5703, "step": 3578 }, { "epoch": 0.1, "learning_rate": 1.976037398572488e-05, "loss": 1.55, "step": 3579 }, { "epoch": 0.1, "learning_rate": 1.9760181476266066e-05, "loss": 1.6758, "step": 3580 }, { "epoch": 0.1, "learning_rate": 1.975998889044818e-05, "loss": 1.3606, "step": 3581 }, { "epoch": 0.1, "learning_rate": 1.9759796228272732e-05, "loss": 1.5093, "step": 3582 }, { "epoch": 0.1, "learning_rate": 1.9759603489741227e-05, "loss": 1.8564, "step": 3583 }, { "epoch": 0.1, "learning_rate": 1.9759410674855174e-05, "loss": 1.541, "step": 3584 }, { "epoch": 0.1, "learning_rate": 1.9759217783616084e-05, "loss": 1.4917, "step": 3585 }, { "epoch": 0.1, "learning_rate": 1.9759024816025457e-05, "loss": 1.4368, "step": 3586 }, { "epoch": 0.1, "learning_rate": 1.9758831772084815e-05, "loss": 1.2788, "step": 3587 }, { "epoch": 0.1, "learning_rate": 1.975863865179566e-05, "loss": 1.519, "step": 3588 }, { "epoch": 0.1, "learning_rate": 1.9758445455159504e-05, "loss": 1.4331, "step": 3589 }, { "epoch": 0.1, "learning_rate": 1.9758252182177856e-05, "loss": 1.5835, "step": 3590 }, { "epoch": 0.1, "learning_rate": 1.9758058832852235e-05, "loss": 1.324, "step": 3591 }, { "epoch": 0.1, "learning_rate": 1.9757865407184154e-05, "loss": 1.3584, "step": 3592 }, { "epoch": 0.1, "learning_rate": 1.9757671905175118e-05, "loss": 1.5596, "step": 3593 }, { "epoch": 0.1, "learning_rate": 1.9757478326826645e-05, "loss": 1.5723, "step": 3594 }, { "epoch": 0.1, "learning_rate": 1.9757284672140252e-05, "loss": 1.4221, "step": 3595 }, { "epoch": 0.1, "learning_rate": 1.975709094111745e-05, "loss": 1.6211, "step": 3596 }, { "epoch": 0.1, "learning_rate": 1.975689713375976e-05, "loss": 1.3396, "step": 3597 }, { "epoch": 0.1, "learning_rate": 1.975670325006869e-05, "loss": 1.626, "step": 3598 }, { "epoch": 0.1, "learning_rate": 1.9756509290045766e-05, "loss": 1.4309, "step": 3599 }, { "epoch": 0.1, "learning_rate": 1.97563152536925e-05, "loss": 1.5703, "step": 3600 }, { "epoch": 0.1, "learning_rate": 1.9756121141010413e-05, "loss": 1.4453, "step": 3601 }, { "epoch": 0.1, "learning_rate": 1.975592695200102e-05, "loss": 1.603, "step": 3602 }, { "epoch": 0.1, "learning_rate": 1.975573268666584e-05, "loss": 1.4048, "step": 3603 }, { "epoch": 0.1, "learning_rate": 1.9755538345006394e-05, "loss": 1.3245, "step": 3604 }, { "epoch": 0.1, "learning_rate": 1.9755343927024206e-05, "loss": 1.4873, "step": 3605 }, { "epoch": 0.1, "learning_rate": 1.97551494327208e-05, "loss": 1.3552, "step": 3606 }, { "epoch": 0.1, "learning_rate": 1.9754954862097683e-05, "loss": 1.5679, "step": 3607 }, { "epoch": 0.1, "learning_rate": 1.9754760215156387e-05, "loss": 1.4172, "step": 3608 }, { "epoch": 0.1, "learning_rate": 1.975456549189844e-05, "loss": 1.4897, "step": 3609 }, { "epoch": 0.1, "learning_rate": 1.9754370692325354e-05, "loss": 1.2725, "step": 3610 }, { "epoch": 0.1, "learning_rate": 1.9754175816438662e-05, "loss": 1.3281, "step": 3611 }, { "epoch": 0.1, "learning_rate": 1.9753980864239882e-05, "loss": 1.4114, "step": 3612 }, { "epoch": 0.1, "learning_rate": 1.9753785835730546e-05, "loss": 1.5874, "step": 3613 }, { "epoch": 0.1, "learning_rate": 1.9753590730912177e-05, "loss": 1.4355, "step": 3614 }, { "epoch": 0.1, "learning_rate": 1.9753395549786297e-05, "loss": 1.3982, "step": 3615 }, { "epoch": 0.1, "learning_rate": 1.9753200292354434e-05, "loss": 1.2947, "step": 3616 }, { "epoch": 0.1, "learning_rate": 1.9753004958618127e-05, "loss": 1.7642, "step": 3617 }, { "epoch": 0.1, "learning_rate": 1.9752809548578886e-05, "loss": 1.4551, "step": 3618 }, { "epoch": 0.1, "learning_rate": 1.9752614062238256e-05, "loss": 1.2346, "step": 3619 }, { "epoch": 0.1, "learning_rate": 1.9752418499597756e-05, "loss": 1.4038, "step": 3620 }, { "epoch": 0.1, "learning_rate": 1.975222286065892e-05, "loss": 1.4722, "step": 3621 }, { "epoch": 0.1, "learning_rate": 1.975202714542328e-05, "loss": 1.4399, "step": 3622 }, { "epoch": 0.1, "learning_rate": 1.9751831353892362e-05, "loss": 1.554, "step": 3623 }, { "epoch": 0.1, "learning_rate": 1.9751635486067707e-05, "loss": 1.6289, "step": 3624 }, { "epoch": 0.1, "learning_rate": 1.9751439541950835e-05, "loss": 1.5732, "step": 3625 }, { "epoch": 0.1, "learning_rate": 1.9751243521543287e-05, "loss": 1.4194, "step": 3626 }, { "epoch": 0.1, "learning_rate": 1.9751047424846596e-05, "loss": 1.5371, "step": 3627 }, { "epoch": 0.1, "learning_rate": 1.9750851251862296e-05, "loss": 1.4595, "step": 3628 }, { "epoch": 0.1, "learning_rate": 1.975065500259192e-05, "loss": 1.3867, "step": 3629 }, { "epoch": 0.1, "learning_rate": 1.9750458677037008e-05, "loss": 1.4927, "step": 3630 }, { "epoch": 0.1, "learning_rate": 1.975026227519909e-05, "loss": 1.5415, "step": 3631 }, { "epoch": 0.1, "learning_rate": 1.97500657970797e-05, "loss": 1.3643, "step": 3632 }, { "epoch": 0.1, "learning_rate": 1.9749869242680385e-05, "loss": 1.2578, "step": 3633 }, { "epoch": 0.1, "learning_rate": 1.974967261200268e-05, "loss": 1.4478, "step": 3634 }, { "epoch": 0.1, "learning_rate": 1.9749475905048114e-05, "loss": 1.3513, "step": 3635 }, { "epoch": 0.1, "learning_rate": 1.9749279121818235e-05, "loss": 1.3757, "step": 3636 }, { "epoch": 0.1, "learning_rate": 1.9749082262314585e-05, "loss": 1.4741, "step": 3637 }, { "epoch": 0.1, "learning_rate": 1.9748885326538695e-05, "loss": 1.5571, "step": 3638 }, { "epoch": 0.1, "learning_rate": 1.9748688314492115e-05, "loss": 1.4395, "step": 3639 }, { "epoch": 0.1, "learning_rate": 1.974849122617638e-05, "loss": 1.5508, "step": 3640 }, { "epoch": 0.1, "learning_rate": 1.9748294061593033e-05, "loss": 1.3708, "step": 3641 }, { "epoch": 0.1, "learning_rate": 1.9748096820743617e-05, "loss": 1.3958, "step": 3642 }, { "epoch": 0.1, "learning_rate": 1.9747899503629675e-05, "loss": 1.5168, "step": 3643 }, { "epoch": 0.1, "learning_rate": 1.9747702110252752e-05, "loss": 1.3994, "step": 3644 }, { "epoch": 0.1, "learning_rate": 1.974750464061439e-05, "loss": 1.5581, "step": 3645 }, { "epoch": 0.1, "learning_rate": 1.9747307094716138e-05, "loss": 1.5833, "step": 3646 }, { "epoch": 0.1, "learning_rate": 1.974710947255954e-05, "loss": 1.3965, "step": 3647 }, { "epoch": 0.1, "learning_rate": 1.9746911774146134e-05, "loss": 1.2451, "step": 3648 }, { "epoch": 0.1, "learning_rate": 1.974671399947748e-05, "loss": 1.4824, "step": 3649 }, { "epoch": 0.1, "learning_rate": 1.9746516148555114e-05, "loss": 1.5354, "step": 3650 }, { "epoch": 0.1, "learning_rate": 1.9746318221380592e-05, "loss": 1.5122, "step": 3651 }, { "epoch": 0.1, "learning_rate": 1.974612021795546e-05, "loss": 1.3408, "step": 3652 }, { "epoch": 0.1, "learning_rate": 1.9745922138281263e-05, "loss": 1.6812, "step": 3653 }, { "epoch": 0.1, "learning_rate": 1.974572398235956e-05, "loss": 1.5635, "step": 3654 }, { "epoch": 0.1, "learning_rate": 1.9745525750191888e-05, "loss": 1.4312, "step": 3655 }, { "epoch": 0.1, "learning_rate": 1.9745327441779808e-05, "loss": 1.4897, "step": 3656 }, { "epoch": 0.1, "learning_rate": 1.974512905712487e-05, "loss": 1.3457, "step": 3657 }, { "epoch": 0.1, "learning_rate": 1.9744930596228623e-05, "loss": 1.4583, "step": 3658 }, { "epoch": 0.1, "learning_rate": 1.9744732059092625e-05, "loss": 1.4204, "step": 3659 }, { "epoch": 0.1, "learning_rate": 1.974453344571842e-05, "loss": 1.3276, "step": 3660 }, { "epoch": 0.1, "learning_rate": 1.9744334756107572e-05, "loss": 1.3958, "step": 3661 }, { "epoch": 0.1, "learning_rate": 1.974413599026163e-05, "loss": 1.4932, "step": 3662 }, { "epoch": 0.1, "learning_rate": 1.974393714818215e-05, "loss": 1.3799, "step": 3663 }, { "epoch": 0.1, "learning_rate": 1.9743738229870687e-05, "loss": 1.5488, "step": 3664 }, { "epoch": 0.1, "learning_rate": 1.97435392353288e-05, "loss": 1.48, "step": 3665 }, { "epoch": 0.1, "learning_rate": 1.9743340164558038e-05, "loss": 1.5127, "step": 3666 }, { "epoch": 0.1, "learning_rate": 1.974314101755997e-05, "loss": 1.668, "step": 3667 }, { "epoch": 0.1, "learning_rate": 1.9742941794336147e-05, "loss": 1.405, "step": 3668 }, { "epoch": 0.1, "learning_rate": 1.974274249488813e-05, "loss": 1.563, "step": 3669 }, { "epoch": 0.1, "learning_rate": 1.9742543119217472e-05, "loss": 1.5796, "step": 3670 }, { "epoch": 0.1, "learning_rate": 1.9742343667325743e-05, "loss": 1.498, "step": 3671 }, { "epoch": 0.1, "learning_rate": 1.9742144139214495e-05, "loss": 1.5479, "step": 3672 }, { "epoch": 0.1, "learning_rate": 1.9741944534885292e-05, "loss": 1.5, "step": 3673 }, { "epoch": 0.1, "learning_rate": 1.97417448543397e-05, "loss": 1.4023, "step": 3674 }, { "epoch": 0.1, "learning_rate": 1.9741545097579277e-05, "loss": 1.4023, "step": 3675 }, { "epoch": 0.1, "learning_rate": 1.974134526460558e-05, "loss": 1.4138, "step": 3676 }, { "epoch": 0.1, "learning_rate": 1.9741145355420184e-05, "loss": 1.4565, "step": 3677 }, { "epoch": 0.1, "learning_rate": 1.9740945370024645e-05, "loss": 1.4888, "step": 3678 }, { "epoch": 0.1, "learning_rate": 1.974074530842053e-05, "loss": 1.4971, "step": 3679 }, { "epoch": 0.1, "learning_rate": 1.9740545170609405e-05, "loss": 1.481, "step": 3680 }, { "epoch": 0.1, "learning_rate": 1.9740344956592836e-05, "loss": 1.4385, "step": 3681 }, { "epoch": 0.1, "learning_rate": 1.9740144666372388e-05, "loss": 1.5181, "step": 3682 }, { "epoch": 0.1, "learning_rate": 1.9739944299949624e-05, "loss": 1.3806, "step": 3683 }, { "epoch": 0.1, "learning_rate": 1.973974385732612e-05, "loss": 1.3979, "step": 3684 }, { "epoch": 0.1, "learning_rate": 1.973954333850344e-05, "loss": 1.5088, "step": 3685 }, { "epoch": 0.1, "learning_rate": 1.9739342743483153e-05, "loss": 1.553, "step": 3686 }, { "epoch": 0.1, "learning_rate": 1.9739142072266825e-05, "loss": 1.3076, "step": 3687 }, { "epoch": 0.1, "learning_rate": 1.973894132485603e-05, "loss": 1.448, "step": 3688 }, { "epoch": 0.1, "learning_rate": 1.9738740501252337e-05, "loss": 1.446, "step": 3689 }, { "epoch": 0.1, "learning_rate": 1.973853960145732e-05, "loss": 1.5227, "step": 3690 }, { "epoch": 0.1, "learning_rate": 1.973833862547255e-05, "loss": 1.5586, "step": 3691 }, { "epoch": 0.1, "learning_rate": 1.9738137573299594e-05, "loss": 1.521, "step": 3692 }, { "epoch": 0.1, "learning_rate": 1.9737936444940032e-05, "loss": 1.2944, "step": 3693 }, { "epoch": 0.1, "learning_rate": 1.9737735240395433e-05, "loss": 1.4229, "step": 3694 }, { "epoch": 0.1, "learning_rate": 1.9737533959667373e-05, "loss": 1.3994, "step": 3695 }, { "epoch": 0.1, "learning_rate": 1.9737332602757426e-05, "loss": 1.3181, "step": 3696 }, { "epoch": 0.1, "learning_rate": 1.9737131169667167e-05, "loss": 1.4333, "step": 3697 }, { "epoch": 0.1, "learning_rate": 1.9736929660398172e-05, "loss": 1.4146, "step": 3698 }, { "epoch": 0.1, "learning_rate": 1.9736728074952018e-05, "loss": 1.3772, "step": 3699 }, { "epoch": 0.1, "learning_rate": 1.9736526413330283e-05, "loss": 1.4514, "step": 3700 }, { "epoch": 0.1, "learning_rate": 1.9736324675534544e-05, "loss": 1.54, "step": 3701 }, { "epoch": 0.1, "learning_rate": 1.973612286156638e-05, "loss": 1.4717, "step": 3702 }, { "epoch": 0.1, "learning_rate": 1.9735920971427366e-05, "loss": 1.5493, "step": 3703 }, { "epoch": 0.1, "learning_rate": 1.9735719005119084e-05, "loss": 1.3301, "step": 3704 }, { "epoch": 0.1, "learning_rate": 1.9735516962643117e-05, "loss": 1.4651, "step": 3705 }, { "epoch": 0.1, "learning_rate": 1.9735314844001046e-05, "loss": 1.7393, "step": 3706 }, { "epoch": 0.1, "learning_rate": 1.9735112649194446e-05, "loss": 1.5801, "step": 3707 }, { "epoch": 0.1, "learning_rate": 1.9734910378224904e-05, "loss": 1.5288, "step": 3708 }, { "epoch": 0.1, "learning_rate": 1.9734708031093998e-05, "loss": 1.3374, "step": 3709 }, { "epoch": 0.1, "learning_rate": 1.9734505607803314e-05, "loss": 1.457, "step": 3710 }, { "epoch": 0.1, "learning_rate": 1.9734303108354437e-05, "loss": 1.3726, "step": 3711 }, { "epoch": 0.1, "learning_rate": 1.9734100532748953e-05, "loss": 1.4453, "step": 3712 }, { "epoch": 0.1, "learning_rate": 1.9733897880988437e-05, "loss": 1.3489, "step": 3713 }, { "epoch": 0.1, "learning_rate": 1.9733695153074487e-05, "loss": 1.3293, "step": 3714 }, { "epoch": 0.1, "learning_rate": 1.973349234900868e-05, "loss": 1.4604, "step": 3715 }, { "epoch": 0.1, "learning_rate": 1.973328946879261e-05, "loss": 1.4458, "step": 3716 }, { "epoch": 0.1, "learning_rate": 1.9733086512427856e-05, "loss": 1.3416, "step": 3717 }, { "epoch": 0.1, "learning_rate": 1.9732883479916012e-05, "loss": 1.4419, "step": 3718 }, { "epoch": 0.1, "learning_rate": 1.973268037125866e-05, "loss": 1.2598, "step": 3719 }, { "epoch": 0.1, "learning_rate": 1.9732477186457398e-05, "loss": 1.342, "step": 3720 }, { "epoch": 0.1, "learning_rate": 1.973227392551381e-05, "loss": 1.5361, "step": 3721 }, { "epoch": 0.1, "learning_rate": 1.9732070588429487e-05, "loss": 1.4712, "step": 3722 }, { "epoch": 0.1, "learning_rate": 1.973186717520602e-05, "loss": 1.5767, "step": 3723 }, { "epoch": 0.1, "learning_rate": 1.9731663685845e-05, "loss": 1.3184, "step": 3724 }, { "epoch": 0.1, "learning_rate": 1.9731460120348023e-05, "loss": 1.4656, "step": 3725 }, { "epoch": 0.1, "learning_rate": 1.9731256478716677e-05, "loss": 1.4775, "step": 3726 }, { "epoch": 0.1, "learning_rate": 1.973105276095255e-05, "loss": 1.4302, "step": 3727 }, { "epoch": 0.1, "learning_rate": 1.973084896705725e-05, "loss": 1.8047, "step": 3728 }, { "epoch": 0.1, "learning_rate": 1.973064509703236e-05, "loss": 1.4883, "step": 3729 }, { "epoch": 0.1, "learning_rate": 1.9730441150879477e-05, "loss": 1.4817, "step": 3730 }, { "epoch": 0.1, "learning_rate": 1.9730237128600202e-05, "loss": 1.2944, "step": 3731 }, { "epoch": 0.1, "learning_rate": 1.973003303019612e-05, "loss": 1.3459, "step": 3732 }, { "epoch": 0.1, "learning_rate": 1.9729828855668843e-05, "loss": 1.4121, "step": 3733 }, { "epoch": 0.1, "learning_rate": 1.9729624605019958e-05, "loss": 1.5488, "step": 3734 }, { "epoch": 0.1, "learning_rate": 1.972942027825106e-05, "loss": 1.3152, "step": 3735 }, { "epoch": 0.1, "learning_rate": 1.972921587536376e-05, "loss": 1.335, "step": 3736 }, { "epoch": 0.1, "learning_rate": 1.9729011396359646e-05, "loss": 1.4841, "step": 3737 }, { "epoch": 0.1, "learning_rate": 1.9728806841240322e-05, "loss": 1.4849, "step": 3738 }, { "epoch": 0.1, "learning_rate": 1.972860221000739e-05, "loss": 1.3716, "step": 3739 }, { "epoch": 0.1, "learning_rate": 1.9728397502662447e-05, "loss": 1.3687, "step": 3740 }, { "epoch": 0.1, "learning_rate": 1.9728192719207097e-05, "loss": 1.5317, "step": 3741 }, { "epoch": 0.1, "learning_rate": 1.9727987859642943e-05, "loss": 1.4927, "step": 3742 }, { "epoch": 0.1, "learning_rate": 1.9727782923971584e-05, "loss": 1.5229, "step": 3743 }, { "epoch": 0.1, "learning_rate": 1.9727577912194627e-05, "loss": 1.4136, "step": 3744 }, { "epoch": 0.1, "learning_rate": 1.9727372824313677e-05, "loss": 1.3945, "step": 3745 }, { "epoch": 0.1, "learning_rate": 1.9727167660330334e-05, "loss": 1.5374, "step": 3746 }, { "epoch": 0.1, "learning_rate": 1.9726962420246203e-05, "loss": 1.5815, "step": 3747 }, { "epoch": 0.1, "learning_rate": 1.9726757104062898e-05, "loss": 1.5679, "step": 3748 }, { "epoch": 0.1, "learning_rate": 1.9726551711782014e-05, "loss": 1.4336, "step": 3749 }, { "epoch": 0.1, "learning_rate": 1.9726346243405167e-05, "loss": 1.4268, "step": 3750 }, { "epoch": 0.1, "learning_rate": 1.9726140698933956e-05, "loss": 1.7007, "step": 3751 }, { "epoch": 0.1, "learning_rate": 1.9725935078369995e-05, "loss": 1.54, "step": 3752 }, { "epoch": 0.1, "learning_rate": 1.9725729381714895e-05, "loss": 1.553, "step": 3753 }, { "epoch": 0.1, "learning_rate": 1.9725523608970257e-05, "loss": 1.6357, "step": 3754 }, { "epoch": 0.1, "learning_rate": 1.97253177601377e-05, "loss": 1.4614, "step": 3755 }, { "epoch": 0.1, "learning_rate": 1.9725111835218825e-05, "loss": 1.4639, "step": 3756 }, { "epoch": 0.1, "learning_rate": 1.972490583421525e-05, "loss": 1.4297, "step": 3757 }, { "epoch": 0.1, "learning_rate": 1.9724699757128587e-05, "loss": 1.5405, "step": 3758 }, { "epoch": 0.1, "learning_rate": 1.9724493603960443e-05, "loss": 1.418, "step": 3759 }, { "epoch": 0.1, "learning_rate": 1.9724287374712436e-05, "loss": 1.4087, "step": 3760 }, { "epoch": 0.1, "learning_rate": 1.972408106938618e-05, "loss": 1.5527, "step": 3761 }, { "epoch": 0.1, "learning_rate": 1.9723874687983282e-05, "loss": 1.5142, "step": 3762 }, { "epoch": 0.1, "learning_rate": 1.972366823050536e-05, "loss": 1.3823, "step": 3763 }, { "epoch": 0.1, "learning_rate": 1.9723461696954032e-05, "loss": 1.4158, "step": 3764 }, { "epoch": 0.1, "learning_rate": 1.972325508733091e-05, "loss": 1.4756, "step": 3765 }, { "epoch": 0.1, "learning_rate": 1.9723048401637618e-05, "loss": 1.4141, "step": 3766 }, { "epoch": 0.1, "learning_rate": 1.9722841639875762e-05, "loss": 1.4429, "step": 3767 }, { "epoch": 0.1, "learning_rate": 1.9722634802046966e-05, "loss": 1.5391, "step": 3768 }, { "epoch": 0.1, "learning_rate": 1.972242788815285e-05, "loss": 1.4734, "step": 3769 }, { "epoch": 0.1, "learning_rate": 1.9722220898195025e-05, "loss": 1.2545, "step": 3770 }, { "epoch": 0.1, "learning_rate": 1.972201383217512e-05, "loss": 1.2891, "step": 3771 }, { "epoch": 0.1, "learning_rate": 1.972180669009475e-05, "loss": 1.4912, "step": 3772 }, { "epoch": 0.1, "learning_rate": 1.972159947195553e-05, "loss": 1.4666, "step": 3773 }, { "epoch": 0.1, "learning_rate": 1.9721392177759095e-05, "loss": 1.4495, "step": 3774 }, { "epoch": 0.1, "learning_rate": 1.9721184807507056e-05, "loss": 1.4631, "step": 3775 }, { "epoch": 0.1, "learning_rate": 1.972097736120104e-05, "loss": 1.5955, "step": 3776 }, { "epoch": 0.1, "learning_rate": 1.9720769838842665e-05, "loss": 1.5054, "step": 3777 }, { "epoch": 0.1, "learning_rate": 1.972056224043356e-05, "loss": 1.3306, "step": 3778 }, { "epoch": 0.1, "learning_rate": 1.9720354565975346e-05, "loss": 1.771, "step": 3779 }, { "epoch": 0.1, "learning_rate": 1.9720146815469647e-05, "loss": 1.325, "step": 3780 }, { "epoch": 0.1, "learning_rate": 1.9719938988918092e-05, "loss": 1.4888, "step": 3781 }, { "epoch": 0.1, "learning_rate": 1.971973108632231e-05, "loss": 1.5867, "step": 3782 }, { "epoch": 0.1, "learning_rate": 1.971952310768391e-05, "loss": 1.3059, "step": 3783 }, { "epoch": 0.1, "learning_rate": 1.971931505300454e-05, "loss": 1.5056, "step": 3784 }, { "epoch": 0.1, "learning_rate": 1.971910692228582e-05, "loss": 1.4871, "step": 3785 }, { "epoch": 0.1, "learning_rate": 1.9718898715529374e-05, "loss": 1.3235, "step": 3786 }, { "epoch": 0.1, "learning_rate": 1.9718690432736838e-05, "loss": 1.5078, "step": 3787 }, { "epoch": 0.1, "learning_rate": 1.9718482073909837e-05, "loss": 1.4312, "step": 3788 }, { "epoch": 0.1, "learning_rate": 1.9718273639050004e-05, "loss": 1.3611, "step": 3789 }, { "epoch": 0.1, "learning_rate": 1.9718065128158966e-05, "loss": 1.4595, "step": 3790 }, { "epoch": 0.1, "learning_rate": 1.9717856541238355e-05, "loss": 1.645, "step": 3791 }, { "epoch": 0.1, "learning_rate": 1.9717647878289802e-05, "loss": 1.438, "step": 3792 }, { "epoch": 0.1, "learning_rate": 1.9717439139314946e-05, "loss": 1.3875, "step": 3793 }, { "epoch": 0.1, "learning_rate": 1.9717230324315414e-05, "loss": 1.4346, "step": 3794 }, { "epoch": 0.1, "learning_rate": 1.9717021433292842e-05, "loss": 1.3862, "step": 3795 }, { "epoch": 0.1, "learning_rate": 1.9716812466248862e-05, "loss": 1.3669, "step": 3796 }, { "epoch": 0.1, "learning_rate": 1.9716603423185113e-05, "loss": 1.4097, "step": 3797 }, { "epoch": 0.1, "learning_rate": 1.971639430410323e-05, "loss": 1.3384, "step": 3798 }, { "epoch": 0.1, "learning_rate": 1.971618510900484e-05, "loss": 1.2966, "step": 3799 }, { "epoch": 0.1, "learning_rate": 1.971597583789159e-05, "loss": 1.4678, "step": 3800 }, { "epoch": 0.1, "learning_rate": 1.9715766490765115e-05, "loss": 1.458, "step": 3801 }, { "epoch": 0.1, "learning_rate": 1.971555706762705e-05, "loss": 1.3313, "step": 3802 }, { "epoch": 0.1, "learning_rate": 1.9715347568479037e-05, "loss": 1.4719, "step": 3803 }, { "epoch": 0.1, "learning_rate": 1.971513799332271e-05, "loss": 1.3987, "step": 3804 }, { "epoch": 0.1, "learning_rate": 1.9714928342159714e-05, "loss": 1.4946, "step": 3805 }, { "epoch": 0.1, "learning_rate": 1.9714718614991685e-05, "loss": 1.4775, "step": 3806 }, { "epoch": 0.1, "learning_rate": 1.9714508811820267e-05, "loss": 1.3386, "step": 3807 }, { "epoch": 0.1, "learning_rate": 1.97142989326471e-05, "loss": 1.4626, "step": 3808 }, { "epoch": 0.1, "learning_rate": 1.9714088977473828e-05, "loss": 1.4641, "step": 3809 }, { "epoch": 0.1, "learning_rate": 1.971387894630209e-05, "loss": 1.4424, "step": 3810 }, { "epoch": 0.1, "learning_rate": 1.971366883913353e-05, "loss": 1.4634, "step": 3811 }, { "epoch": 0.1, "learning_rate": 1.9713458655969794e-05, "loss": 1.5347, "step": 3812 }, { "epoch": 0.1, "learning_rate": 1.9713248396812524e-05, "loss": 1.4639, "step": 3813 }, { "epoch": 0.1, "learning_rate": 1.9713038061663368e-05, "loss": 1.4958, "step": 3814 }, { "epoch": 0.1, "learning_rate": 1.9712827650523966e-05, "loss": 1.3535, "step": 3815 }, { "epoch": 0.1, "learning_rate": 1.9712617163395974e-05, "loss": 1.4116, "step": 3816 }, { "epoch": 0.1, "learning_rate": 1.9712406600281026e-05, "loss": 1.2825, "step": 3817 }, { "epoch": 0.1, "learning_rate": 1.9712195961180778e-05, "loss": 1.5164, "step": 3818 }, { "epoch": 0.1, "learning_rate": 1.9711985246096877e-05, "loss": 1.4216, "step": 3819 }, { "epoch": 0.1, "learning_rate": 1.971177445503097e-05, "loss": 1.4419, "step": 3820 }, { "epoch": 0.1, "learning_rate": 1.9711563587984707e-05, "loss": 1.4771, "step": 3821 }, { "epoch": 0.1, "learning_rate": 1.9711352644959737e-05, "loss": 1.4844, "step": 3822 }, { "epoch": 0.1, "learning_rate": 1.9711141625957708e-05, "loss": 1.2617, "step": 3823 }, { "epoch": 0.1, "learning_rate": 1.9710930530980275e-05, "loss": 1.4473, "step": 3824 }, { "epoch": 0.1, "learning_rate": 1.971071936002909e-05, "loss": 1.3462, "step": 3825 }, { "epoch": 0.1, "learning_rate": 1.97105081131058e-05, "loss": 1.3274, "step": 3826 }, { "epoch": 0.1, "learning_rate": 1.9710296790212062e-05, "loss": 1.3843, "step": 3827 }, { "epoch": 0.1, "learning_rate": 1.971008539134953e-05, "loss": 1.3989, "step": 3828 }, { "epoch": 0.1, "learning_rate": 1.9709873916519853e-05, "loss": 1.584, "step": 3829 }, { "epoch": 0.1, "learning_rate": 1.9709662365724688e-05, "loss": 1.4609, "step": 3830 }, { "epoch": 0.1, "learning_rate": 1.970945073896569e-05, "loss": 1.4194, "step": 3831 }, { "epoch": 0.1, "learning_rate": 1.9709239036244517e-05, "loss": 1.5371, "step": 3832 }, { "epoch": 0.1, "learning_rate": 1.9709027257562825e-05, "loss": 1.4263, "step": 3833 }, { "epoch": 0.1, "learning_rate": 1.9708815402922265e-05, "loss": 1.4927, "step": 3834 }, { "epoch": 0.1, "learning_rate": 1.9708603472324502e-05, "loss": 1.4009, "step": 3835 }, { "epoch": 0.1, "learning_rate": 1.9708391465771188e-05, "loss": 1.386, "step": 3836 }, { "epoch": 0.1, "learning_rate": 1.970817938326399e-05, "loss": 1.4451, "step": 3837 }, { "epoch": 0.1, "learning_rate": 1.9707967224804555e-05, "loss": 1.5515, "step": 3838 }, { "epoch": 0.1, "learning_rate": 1.9707754990394553e-05, "loss": 1.3994, "step": 3839 }, { "epoch": 0.1, "learning_rate": 1.970754268003564e-05, "loss": 1.6436, "step": 3840 }, { "epoch": 0.1, "learning_rate": 1.970733029372948e-05, "loss": 1.4868, "step": 3841 }, { "epoch": 0.1, "learning_rate": 1.970711783147773e-05, "loss": 1.7944, "step": 3842 }, { "epoch": 0.1, "learning_rate": 1.9706905293282054e-05, "loss": 1.2935, "step": 3843 }, { "epoch": 0.1, "learning_rate": 1.9706692679144116e-05, "loss": 1.3486, "step": 3844 }, { "epoch": 0.11, "learning_rate": 1.970647998906558e-05, "loss": 1.3948, "step": 3845 }, { "epoch": 0.11, "learning_rate": 1.9706267223048106e-05, "loss": 1.5825, "step": 3846 }, { "epoch": 0.11, "learning_rate": 1.9706054381093366e-05, "loss": 1.4854, "step": 3847 }, { "epoch": 0.11, "learning_rate": 1.970584146320302e-05, "loss": 1.6111, "step": 3848 }, { "epoch": 0.11, "learning_rate": 1.970562846937873e-05, "loss": 1.4648, "step": 3849 }, { "epoch": 0.11, "learning_rate": 1.9705415399622173e-05, "loss": 1.4141, "step": 3850 }, { "epoch": 0.11, "learning_rate": 1.9705202253935004e-05, "loss": 1.4543, "step": 3851 }, { "epoch": 0.11, "learning_rate": 1.97049890323189e-05, "loss": 1.4204, "step": 3852 }, { "epoch": 0.11, "learning_rate": 1.970477573477552e-05, "loss": 1.3521, "step": 3853 }, { "epoch": 0.11, "learning_rate": 1.9704562361306546e-05, "loss": 1.3677, "step": 3854 }, { "epoch": 0.11, "learning_rate": 1.9704348911913636e-05, "loss": 1.5198, "step": 3855 }, { "epoch": 0.11, "learning_rate": 1.970413538659846e-05, "loss": 1.4004, "step": 3856 }, { "epoch": 0.11, "learning_rate": 1.9703921785362698e-05, "loss": 1.332, "step": 3857 }, { "epoch": 0.11, "learning_rate": 1.9703708108208013e-05, "loss": 1.5361, "step": 3858 }, { "epoch": 0.11, "learning_rate": 1.9703494355136075e-05, "loss": 1.5547, "step": 3859 }, { "epoch": 0.11, "learning_rate": 1.9703280526148566e-05, "loss": 1.3784, "step": 3860 }, { "epoch": 0.11, "learning_rate": 1.9703066621247145e-05, "loss": 1.4575, "step": 3861 }, { "epoch": 0.11, "learning_rate": 1.97028526404335e-05, "loss": 1.4341, "step": 3862 }, { "epoch": 0.11, "learning_rate": 1.9702638583709297e-05, "loss": 1.5447, "step": 3863 }, { "epoch": 0.11, "learning_rate": 1.9702424451076214e-05, "loss": 1.4524, "step": 3864 }, { "epoch": 0.11, "learning_rate": 1.970221024253592e-05, "loss": 1.4097, "step": 3865 }, { "epoch": 0.11, "learning_rate": 1.97019959580901e-05, "loss": 1.4895, "step": 3866 }, { "epoch": 0.11, "learning_rate": 1.9701781597740424e-05, "loss": 1.5771, "step": 3867 }, { "epoch": 0.11, "learning_rate": 1.970156716148857e-05, "loss": 1.5107, "step": 3868 }, { "epoch": 0.11, "learning_rate": 1.970135264933622e-05, "loss": 1.4321, "step": 3869 }, { "epoch": 0.11, "learning_rate": 1.9701138061285047e-05, "loss": 1.3142, "step": 3870 }, { "epoch": 0.11, "learning_rate": 1.9700923397336728e-05, "loss": 1.5415, "step": 3871 }, { "epoch": 0.11, "learning_rate": 1.9700708657492948e-05, "loss": 1.5366, "step": 3872 }, { "epoch": 0.11, "learning_rate": 1.9700493841755386e-05, "loss": 1.3535, "step": 3873 }, { "epoch": 0.11, "learning_rate": 1.9700278950125722e-05, "loss": 1.5234, "step": 3874 }, { "epoch": 0.11, "learning_rate": 1.9700063982605636e-05, "loss": 1.5576, "step": 3875 }, { "epoch": 0.11, "learning_rate": 1.9699848939196812e-05, "loss": 1.7866, "step": 3876 }, { "epoch": 0.11, "learning_rate": 1.969963381990093e-05, "loss": 1.4937, "step": 3877 }, { "epoch": 0.11, "learning_rate": 1.9699418624719673e-05, "loss": 1.2219, "step": 3878 }, { "epoch": 0.11, "learning_rate": 1.9699203353654725e-05, "loss": 1.342, "step": 3879 }, { "epoch": 0.11, "learning_rate": 1.9698988006707775e-05, "loss": 1.623, "step": 3880 }, { "epoch": 0.11, "learning_rate": 1.96987725838805e-05, "loss": 1.3008, "step": 3881 }, { "epoch": 0.11, "learning_rate": 1.969855708517459e-05, "loss": 1.4016, "step": 3882 }, { "epoch": 0.11, "learning_rate": 1.969834151059173e-05, "loss": 1.343, "step": 3883 }, { "epoch": 0.11, "learning_rate": 1.9698125860133608e-05, "loss": 1.6606, "step": 3884 }, { "epoch": 0.11, "learning_rate": 1.969791013380191e-05, "loss": 1.3586, "step": 3885 }, { "epoch": 0.11, "learning_rate": 1.969769433159832e-05, "loss": 1.519, "step": 3886 }, { "epoch": 0.11, "learning_rate": 1.969747845352453e-05, "loss": 1.417, "step": 3887 }, { "epoch": 0.11, "learning_rate": 1.9697262499582233e-05, "loss": 1.4595, "step": 3888 }, { "epoch": 0.11, "learning_rate": 1.969704646977311e-05, "loss": 1.3396, "step": 3889 }, { "epoch": 0.11, "learning_rate": 1.9696830364098857e-05, "loss": 1.4097, "step": 3890 }, { "epoch": 0.11, "learning_rate": 1.969661418256116e-05, "loss": 1.3608, "step": 3891 }, { "epoch": 0.11, "learning_rate": 1.969639792516172e-05, "loss": 1.5378, "step": 3892 }, { "epoch": 0.11, "learning_rate": 1.9696181591902217e-05, "loss": 1.4824, "step": 3893 }, { "epoch": 0.11, "learning_rate": 1.9695965182784347e-05, "loss": 1.4944, "step": 3894 }, { "epoch": 0.11, "learning_rate": 1.9695748697809808e-05, "loss": 1.3215, "step": 3895 }, { "epoch": 0.11, "learning_rate": 1.969553213698029e-05, "loss": 1.5391, "step": 3896 }, { "epoch": 0.11, "learning_rate": 1.9695315500297488e-05, "loss": 1.4121, "step": 3897 }, { "epoch": 0.11, "learning_rate": 1.9695098787763096e-05, "loss": 1.4453, "step": 3898 }, { "epoch": 0.11, "learning_rate": 1.969488199937881e-05, "loss": 1.4238, "step": 3899 }, { "epoch": 0.11, "learning_rate": 1.969466513514633e-05, "loss": 1.334, "step": 3900 }, { "epoch": 0.11, "learning_rate": 1.9694448195067344e-05, "loss": 1.4839, "step": 3901 }, { "epoch": 0.11, "learning_rate": 1.9694231179143552e-05, "loss": 1.4403, "step": 3902 }, { "epoch": 0.11, "learning_rate": 1.969401408737666e-05, "loss": 1.6587, "step": 3903 }, { "epoch": 0.11, "learning_rate": 1.9693796919768354e-05, "loss": 1.4316, "step": 3904 }, { "epoch": 0.11, "learning_rate": 1.9693579676320345e-05, "loss": 1.364, "step": 3905 }, { "epoch": 0.11, "learning_rate": 1.969336235703432e-05, "loss": 1.426, "step": 3906 }, { "epoch": 0.11, "learning_rate": 1.9693144961911994e-05, "loss": 1.4299, "step": 3907 }, { "epoch": 0.11, "learning_rate": 1.9692927490955055e-05, "loss": 1.4958, "step": 3908 }, { "epoch": 0.11, "learning_rate": 1.969270994416521e-05, "loss": 1.4258, "step": 3909 }, { "epoch": 0.11, "learning_rate": 1.9692492321544162e-05, "loss": 1.521, "step": 3910 }, { "epoch": 0.11, "learning_rate": 1.969227462309361e-05, "loss": 1.5898, "step": 3911 }, { "epoch": 0.11, "learning_rate": 1.969205684881526e-05, "loss": 1.3477, "step": 3912 }, { "epoch": 0.11, "learning_rate": 1.9691838998710816e-05, "loss": 1.3162, "step": 3913 }, { "epoch": 0.11, "learning_rate": 1.969162107278198e-05, "loss": 1.3569, "step": 3914 }, { "epoch": 0.11, "learning_rate": 1.9691403071030456e-05, "loss": 1.5332, "step": 3915 }, { "epoch": 0.11, "learning_rate": 1.9691184993457952e-05, "loss": 1.4448, "step": 3916 }, { "epoch": 0.11, "learning_rate": 1.9690966840066174e-05, "loss": 1.1736, "step": 3917 }, { "epoch": 0.11, "learning_rate": 1.969074861085683e-05, "loss": 1.5752, "step": 3918 }, { "epoch": 0.11, "learning_rate": 1.9690530305831626e-05, "loss": 1.5046, "step": 3919 }, { "epoch": 0.11, "learning_rate": 1.9690311924992268e-05, "loss": 1.4375, "step": 3920 }, { "epoch": 0.11, "learning_rate": 1.9690093468340465e-05, "loss": 1.4868, "step": 3921 }, { "epoch": 0.11, "learning_rate": 1.968987493587793e-05, "loss": 1.5342, "step": 3922 }, { "epoch": 0.11, "learning_rate": 1.968965632760637e-05, "loss": 1.605, "step": 3923 }, { "epoch": 0.11, "learning_rate": 1.9689437643527494e-05, "loss": 1.4663, "step": 3924 }, { "epoch": 0.11, "learning_rate": 1.9689218883643013e-05, "loss": 1.4539, "step": 3925 }, { "epoch": 0.11, "learning_rate": 1.9689000047954642e-05, "loss": 1.593, "step": 3926 }, { "epoch": 0.11, "learning_rate": 1.968878113646409e-05, "loss": 1.6382, "step": 3927 }, { "epoch": 0.11, "learning_rate": 1.968856214917307e-05, "loss": 1.4453, "step": 3928 }, { "epoch": 0.11, "learning_rate": 1.9688343086083295e-05, "loss": 1.4712, "step": 3929 }, { "epoch": 0.11, "learning_rate": 1.968812394719648e-05, "loss": 1.5581, "step": 3930 }, { "epoch": 0.11, "learning_rate": 1.968790473251434e-05, "loss": 1.3103, "step": 3931 }, { "epoch": 0.11, "learning_rate": 1.9687685442038587e-05, "loss": 1.5005, "step": 3932 }, { "epoch": 0.11, "learning_rate": 1.9687466075770944e-05, "loss": 1.5322, "step": 3933 }, { "epoch": 0.11, "learning_rate": 1.9687246633713116e-05, "loss": 1.3806, "step": 3934 }, { "epoch": 0.11, "learning_rate": 1.9687027115866826e-05, "loss": 1.4485, "step": 3935 }, { "epoch": 0.11, "learning_rate": 1.968680752223379e-05, "loss": 1.5415, "step": 3936 }, { "epoch": 0.11, "learning_rate": 1.9686587852815733e-05, "loss": 1.3735, "step": 3937 }, { "epoch": 0.11, "learning_rate": 1.9686368107614365e-05, "loss": 1.4385, "step": 3938 }, { "epoch": 0.11, "learning_rate": 1.9686148286631405e-05, "loss": 1.5308, "step": 3939 }, { "epoch": 0.11, "learning_rate": 1.9685928389868575e-05, "loss": 1.304, "step": 3940 }, { "epoch": 0.11, "learning_rate": 1.96857084173276e-05, "loss": 1.5332, "step": 3941 }, { "epoch": 0.11, "learning_rate": 1.9685488369010195e-05, "loss": 1.5, "step": 3942 }, { "epoch": 0.11, "learning_rate": 1.9685268244918084e-05, "loss": 1.4707, "step": 3943 }, { "epoch": 0.11, "learning_rate": 1.9685048045052988e-05, "loss": 1.4509, "step": 3944 }, { "epoch": 0.11, "learning_rate": 1.968482776941663e-05, "loss": 1.3882, "step": 3945 }, { "epoch": 0.11, "learning_rate": 1.9684607418010733e-05, "loss": 1.4053, "step": 3946 }, { "epoch": 0.11, "learning_rate": 1.968438699083702e-05, "loss": 1.4797, "step": 3947 }, { "epoch": 0.11, "learning_rate": 1.968416648789722e-05, "loss": 1.3557, "step": 3948 }, { "epoch": 0.11, "learning_rate": 1.9683945909193056e-05, "loss": 1.439, "step": 3949 }, { "epoch": 0.11, "learning_rate": 1.968372525472625e-05, "loss": 1.4158, "step": 3950 }, { "epoch": 0.11, "learning_rate": 1.9683504524498535e-05, "loss": 1.4436, "step": 3951 }, { "epoch": 0.11, "learning_rate": 1.9683283718511634e-05, "loss": 1.5352, "step": 3952 }, { "epoch": 0.11, "learning_rate": 1.968306283676727e-05, "loss": 1.4575, "step": 3953 }, { "epoch": 0.11, "learning_rate": 1.9682841879267182e-05, "loss": 1.5034, "step": 3954 }, { "epoch": 0.11, "learning_rate": 1.9682620846013084e-05, "loss": 1.4102, "step": 3955 }, { "epoch": 0.11, "learning_rate": 1.9682399737006722e-05, "loss": 1.5381, "step": 3956 }, { "epoch": 0.11, "learning_rate": 1.9682178552249814e-05, "loss": 1.4919, "step": 3957 }, { "epoch": 0.11, "learning_rate": 1.968195729174409e-05, "loss": 1.5132, "step": 3958 }, { "epoch": 0.11, "learning_rate": 1.968173595549129e-05, "loss": 1.3254, "step": 3959 }, { "epoch": 0.11, "learning_rate": 1.968151454349314e-05, "loss": 1.4922, "step": 3960 }, { "epoch": 0.11, "learning_rate": 1.968129305575137e-05, "loss": 1.4966, "step": 3961 }, { "epoch": 0.11, "learning_rate": 1.968107149226772e-05, "loss": 1.3967, "step": 3962 }, { "epoch": 0.11, "learning_rate": 1.9680849853043914e-05, "loss": 1.3474, "step": 3963 }, { "epoch": 0.11, "learning_rate": 1.9680628138081694e-05, "loss": 1.3142, "step": 3964 }, { "epoch": 0.11, "learning_rate": 1.9680406347382793e-05, "loss": 1.5359, "step": 3965 }, { "epoch": 0.11, "learning_rate": 1.968018448094894e-05, "loss": 1.3816, "step": 3966 }, { "epoch": 0.11, "learning_rate": 1.967996253878188e-05, "loss": 1.5327, "step": 3967 }, { "epoch": 0.11, "learning_rate": 1.9679740520883345e-05, "loss": 1.491, "step": 3968 }, { "epoch": 0.11, "learning_rate": 1.967951842725507e-05, "loss": 1.4531, "step": 3969 }, { "epoch": 0.11, "learning_rate": 1.9679296257898794e-05, "loss": 1.4111, "step": 3970 }, { "epoch": 0.11, "learning_rate": 1.9679074012816254e-05, "loss": 1.488, "step": 3971 }, { "epoch": 0.11, "learning_rate": 1.9678851692009196e-05, "loss": 1.3176, "step": 3972 }, { "epoch": 0.11, "learning_rate": 1.9678629295479347e-05, "loss": 1.3667, "step": 3973 }, { "epoch": 0.11, "learning_rate": 1.9678406823228456e-05, "loss": 1.5352, "step": 3974 }, { "epoch": 0.11, "learning_rate": 1.9678184275258264e-05, "loss": 1.5198, "step": 3975 }, { "epoch": 0.11, "learning_rate": 1.9677961651570507e-05, "loss": 1.4844, "step": 3976 }, { "epoch": 0.11, "learning_rate": 1.9677738952166928e-05, "loss": 1.4404, "step": 3977 }, { "epoch": 0.11, "learning_rate": 1.9677516177049273e-05, "loss": 1.4155, "step": 3978 }, { "epoch": 0.11, "learning_rate": 1.967729332621928e-05, "loss": 1.4285, "step": 3979 }, { "epoch": 0.11, "learning_rate": 1.9677070399678696e-05, "loss": 1.4624, "step": 3980 }, { "epoch": 0.11, "learning_rate": 1.9676847397429265e-05, "loss": 1.4241, "step": 3981 }, { "epoch": 0.11, "learning_rate": 1.9676624319472726e-05, "loss": 1.4399, "step": 3982 }, { "epoch": 0.11, "learning_rate": 1.967640116581083e-05, "loss": 1.375, "step": 3983 }, { "epoch": 0.11, "learning_rate": 1.9676177936445322e-05, "loss": 1.4792, "step": 3984 }, { "epoch": 0.11, "learning_rate": 1.9675954631377946e-05, "loss": 1.4507, "step": 3985 }, { "epoch": 0.11, "learning_rate": 1.9675731250610456e-05, "loss": 1.4771, "step": 3986 }, { "epoch": 0.11, "learning_rate": 1.967550779414459e-05, "loss": 1.5107, "step": 3987 }, { "epoch": 0.11, "learning_rate": 1.9675284261982104e-05, "loss": 1.3914, "step": 3988 }, { "epoch": 0.11, "learning_rate": 1.967506065412474e-05, "loss": 1.5422, "step": 3989 }, { "epoch": 0.11, "learning_rate": 1.9674836970574253e-05, "loss": 1.3857, "step": 3990 }, { "epoch": 0.11, "learning_rate": 1.967461321133239e-05, "loss": 1.3091, "step": 3991 }, { "epoch": 0.11, "learning_rate": 1.9674389376400905e-05, "loss": 1.4409, "step": 3992 }, { "epoch": 0.11, "learning_rate": 1.9674165465781544e-05, "loss": 1.3325, "step": 3993 }, { "epoch": 0.11, "learning_rate": 1.9673941479476065e-05, "loss": 1.3596, "step": 3994 }, { "epoch": 0.11, "learning_rate": 1.9673717417486213e-05, "loss": 1.4937, "step": 3995 }, { "epoch": 0.11, "learning_rate": 1.9673493279813748e-05, "loss": 1.4658, "step": 3996 }, { "epoch": 0.11, "learning_rate": 1.967326906646042e-05, "loss": 1.2998, "step": 3997 }, { "epoch": 0.11, "learning_rate": 1.9673044777427977e-05, "loss": 1.4917, "step": 3998 }, { "epoch": 0.11, "learning_rate": 1.9672820412718186e-05, "loss": 1.8525, "step": 3999 }, { "epoch": 0.11, "learning_rate": 1.9672595972332798e-05, "loss": 1.5107, "step": 4000 }, { "epoch": 0.11, "learning_rate": 1.9672371456273564e-05, "loss": 1.4712, "step": 4001 }, { "epoch": 0.11, "learning_rate": 1.9672146864542247e-05, "loss": 1.5967, "step": 4002 }, { "epoch": 0.11, "learning_rate": 1.9671922197140597e-05, "loss": 1.4907, "step": 4003 }, { "epoch": 0.11, "learning_rate": 1.967169745407038e-05, "loss": 1.4478, "step": 4004 }, { "epoch": 0.11, "learning_rate": 1.9671472635333352e-05, "loss": 1.4463, "step": 4005 }, { "epoch": 0.11, "learning_rate": 1.9671247740931263e-05, "loss": 1.314, "step": 4006 }, { "epoch": 0.11, "learning_rate": 1.9671022770865883e-05, "loss": 1.4629, "step": 4007 }, { "epoch": 0.11, "learning_rate": 1.967079772513897e-05, "loss": 1.3726, "step": 4008 }, { "epoch": 0.11, "learning_rate": 1.967057260375228e-05, "loss": 1.4199, "step": 4009 }, { "epoch": 0.11, "learning_rate": 1.9670347406707578e-05, "loss": 1.5676, "step": 4010 }, { "epoch": 0.11, "learning_rate": 1.9670122134006626e-05, "loss": 1.2661, "step": 4011 }, { "epoch": 0.11, "learning_rate": 1.966989678565119e-05, "loss": 1.3008, "step": 4012 }, { "epoch": 0.11, "learning_rate": 1.966967136164302e-05, "loss": 1.3955, "step": 4013 }, { "epoch": 0.11, "learning_rate": 1.9669445861983893e-05, "loss": 1.3647, "step": 4014 }, { "epoch": 0.11, "learning_rate": 1.9669220286675566e-05, "loss": 1.5105, "step": 4015 }, { "epoch": 0.11, "learning_rate": 1.966899463571981e-05, "loss": 1.4646, "step": 4016 }, { "epoch": 0.11, "learning_rate": 1.966876890911839e-05, "loss": 1.5457, "step": 4017 }, { "epoch": 0.11, "learning_rate": 1.9668543106873058e-05, "loss": 1.4182, "step": 4018 }, { "epoch": 0.11, "learning_rate": 1.96683172289856e-05, "loss": 1.5117, "step": 4019 }, { "epoch": 0.11, "learning_rate": 1.9668091275457772e-05, "loss": 1.4373, "step": 4020 }, { "epoch": 0.11, "learning_rate": 1.966786524629134e-05, "loss": 1.5234, "step": 4021 }, { "epoch": 0.11, "learning_rate": 1.9667639141488083e-05, "loss": 1.5591, "step": 4022 }, { "epoch": 0.11, "learning_rate": 1.9667412961049755e-05, "loss": 1.4004, "step": 4023 }, { "epoch": 0.11, "learning_rate": 1.966718670497814e-05, "loss": 1.3579, "step": 4024 }, { "epoch": 0.11, "learning_rate": 1.9666960373275003e-05, "loss": 1.1458, "step": 4025 }, { "epoch": 0.11, "learning_rate": 1.9666733965942112e-05, "loss": 1.4028, "step": 4026 }, { "epoch": 0.11, "learning_rate": 1.966650748298124e-05, "loss": 1.3738, "step": 4027 }, { "epoch": 0.11, "learning_rate": 1.9666280924394157e-05, "loss": 1.4788, "step": 4028 }, { "epoch": 0.11, "learning_rate": 1.966605429018264e-05, "loss": 1.5288, "step": 4029 }, { "epoch": 0.11, "learning_rate": 1.966582758034846e-05, "loss": 1.6108, "step": 4030 }, { "epoch": 0.11, "learning_rate": 1.966560079489339e-05, "loss": 1.8066, "step": 4031 }, { "epoch": 0.11, "learning_rate": 1.9665373933819204e-05, "loss": 1.5708, "step": 4032 }, { "epoch": 0.11, "learning_rate": 1.9665146997127675e-05, "loss": 1.4492, "step": 4033 }, { "epoch": 0.11, "learning_rate": 1.9664919984820584e-05, "loss": 1.4512, "step": 4034 }, { "epoch": 0.11, "learning_rate": 1.96646928968997e-05, "loss": 1.481, "step": 4035 }, { "epoch": 0.11, "learning_rate": 1.9664465733366806e-05, "loss": 1.4453, "step": 4036 }, { "epoch": 0.11, "learning_rate": 1.966423849422368e-05, "loss": 1.5859, "step": 4037 }, { "epoch": 0.11, "learning_rate": 1.9664011179472092e-05, "loss": 1.8628, "step": 4038 }, { "epoch": 0.11, "learning_rate": 1.9663783789113827e-05, "loss": 1.4387, "step": 4039 }, { "epoch": 0.11, "learning_rate": 1.9663556323150658e-05, "loss": 1.4495, "step": 4040 }, { "epoch": 0.11, "learning_rate": 1.9663328781584373e-05, "loss": 1.4321, "step": 4041 }, { "epoch": 0.11, "learning_rate": 1.9663101164416743e-05, "loss": 1.427, "step": 4042 }, { "epoch": 0.11, "learning_rate": 1.966287347164956e-05, "loss": 1.3667, "step": 4043 }, { "epoch": 0.11, "learning_rate": 1.9662645703284592e-05, "loss": 1.4768, "step": 4044 }, { "epoch": 0.11, "learning_rate": 1.966241785932363e-05, "loss": 1.3818, "step": 4045 }, { "epoch": 0.11, "learning_rate": 1.9662189939768455e-05, "loss": 1.5186, "step": 4046 }, { "epoch": 0.11, "learning_rate": 1.966196194462085e-05, "loss": 1.7856, "step": 4047 }, { "epoch": 0.11, "learning_rate": 1.96617338738826e-05, "loss": 1.4751, "step": 4048 }, { "epoch": 0.11, "learning_rate": 1.9661505727555482e-05, "loss": 1.4521, "step": 4049 }, { "epoch": 0.11, "learning_rate": 1.966127750564129e-05, "loss": 1.3137, "step": 4050 }, { "epoch": 0.11, "learning_rate": 1.9661049208141804e-05, "loss": 1.5674, "step": 4051 }, { "epoch": 0.11, "learning_rate": 1.9660820835058813e-05, "loss": 1.5894, "step": 4052 }, { "epoch": 0.11, "learning_rate": 1.96605923863941e-05, "loss": 1.5337, "step": 4053 }, { "epoch": 0.11, "learning_rate": 1.966036386214946e-05, "loss": 1.8423, "step": 4054 }, { "epoch": 0.11, "learning_rate": 1.9660135262326674e-05, "loss": 1.5408, "step": 4055 }, { "epoch": 0.11, "learning_rate": 1.965990658692753e-05, "loss": 1.4578, "step": 4056 }, { "epoch": 0.11, "learning_rate": 1.9659677835953822e-05, "loss": 1.4807, "step": 4057 }, { "epoch": 0.11, "learning_rate": 1.9659449009407335e-05, "loss": 1.3003, "step": 4058 }, { "epoch": 0.11, "learning_rate": 1.9659220107289863e-05, "loss": 1.4297, "step": 4059 }, { "epoch": 0.11, "learning_rate": 1.9658991129603195e-05, "loss": 1.5537, "step": 4060 }, { "epoch": 0.11, "learning_rate": 1.965876207634912e-05, "loss": 1.2871, "step": 4061 }, { "epoch": 0.11, "learning_rate": 1.9658532947529435e-05, "loss": 1.2817, "step": 4062 }, { "epoch": 0.11, "learning_rate": 1.9658303743145928e-05, "loss": 1.4785, "step": 4063 }, { "epoch": 0.11, "learning_rate": 1.9658074463200394e-05, "loss": 1.5771, "step": 4064 }, { "epoch": 0.11, "learning_rate": 1.9657845107694625e-05, "loss": 1.3513, "step": 4065 }, { "epoch": 0.11, "learning_rate": 1.965761567663042e-05, "loss": 1.4312, "step": 4066 }, { "epoch": 0.11, "learning_rate": 1.9657386170009573e-05, "loss": 1.3196, "step": 4067 }, { "epoch": 0.11, "learning_rate": 1.9657156587833877e-05, "loss": 1.4204, "step": 4068 }, { "epoch": 0.11, "learning_rate": 1.965692693010513e-05, "loss": 1.4355, "step": 4069 }, { "epoch": 0.11, "learning_rate": 1.9656697196825127e-05, "loss": 1.4839, "step": 4070 }, { "epoch": 0.11, "learning_rate": 1.9656467387995663e-05, "loss": 1.4731, "step": 4071 }, { "epoch": 0.11, "learning_rate": 1.965623750361854e-05, "loss": 1.2888, "step": 4072 }, { "epoch": 0.11, "learning_rate": 1.9656007543695557e-05, "loss": 1.4424, "step": 4073 }, { "epoch": 0.11, "learning_rate": 1.965577750822851e-05, "loss": 1.2834, "step": 4074 }, { "epoch": 0.11, "learning_rate": 1.9655547397219198e-05, "loss": 1.2896, "step": 4075 }, { "epoch": 0.11, "learning_rate": 1.9655317210669428e-05, "loss": 1.366, "step": 4076 }, { "epoch": 0.11, "learning_rate": 1.9655086948580996e-05, "loss": 1.4287, "step": 4077 }, { "epoch": 0.11, "learning_rate": 1.96548566109557e-05, "loss": 1.4595, "step": 4078 }, { "epoch": 0.11, "learning_rate": 1.965462619779535e-05, "loss": 1.3749, "step": 4079 }, { "epoch": 0.11, "learning_rate": 1.9654395709101742e-05, "loss": 1.4041, "step": 4080 }, { "epoch": 0.11, "learning_rate": 1.9654165144876685e-05, "loss": 1.5598, "step": 4081 }, { "epoch": 0.11, "learning_rate": 1.9653934505121977e-05, "loss": 1.3638, "step": 4082 }, { "epoch": 0.11, "learning_rate": 1.9653703789839425e-05, "loss": 1.4156, "step": 4083 }, { "epoch": 0.11, "learning_rate": 1.9653472999030835e-05, "loss": 1.4053, "step": 4084 }, { "epoch": 0.11, "learning_rate": 1.9653242132698013e-05, "loss": 1.4934, "step": 4085 }, { "epoch": 0.11, "learning_rate": 1.965301119084276e-05, "loss": 1.7598, "step": 4086 }, { "epoch": 0.11, "learning_rate": 1.965278017346689e-05, "loss": 1.4976, "step": 4087 }, { "epoch": 0.11, "learning_rate": 1.9652549080572206e-05, "loss": 1.5576, "step": 4088 }, { "epoch": 0.11, "learning_rate": 1.9652317912160516e-05, "loss": 1.4133, "step": 4089 }, { "epoch": 0.11, "learning_rate": 1.965208666823363e-05, "loss": 1.4971, "step": 4090 }, { "epoch": 0.11, "learning_rate": 1.965185534879336e-05, "loss": 1.5259, "step": 4091 }, { "epoch": 0.11, "learning_rate": 1.9651623953841508e-05, "loss": 1.5156, "step": 4092 }, { "epoch": 0.11, "learning_rate": 1.9651392483379888e-05, "loss": 1.5903, "step": 4093 }, { "epoch": 0.11, "learning_rate": 1.9651160937410316e-05, "loss": 1.5017, "step": 4094 }, { "epoch": 0.11, "learning_rate": 1.9650929315934593e-05, "loss": 1.5664, "step": 4095 }, { "epoch": 0.11, "learning_rate": 1.965069761895454e-05, "loss": 1.5576, "step": 4096 }, { "epoch": 0.11, "learning_rate": 1.965046584647197e-05, "loss": 1.3328, "step": 4097 }, { "epoch": 0.11, "learning_rate": 1.9650233998488693e-05, "loss": 1.4146, "step": 4098 }, { "epoch": 0.11, "learning_rate": 1.965000207500652e-05, "loss": 1.4575, "step": 4099 }, { "epoch": 0.11, "learning_rate": 1.964977007602727e-05, "loss": 1.3992, "step": 4100 }, { "epoch": 0.11, "learning_rate": 1.9649538001552753e-05, "loss": 1.4268, "step": 4101 }, { "epoch": 0.11, "learning_rate": 1.9649305851584796e-05, "loss": 1.5488, "step": 4102 }, { "epoch": 0.11, "learning_rate": 1.96490736261252e-05, "loss": 1.5938, "step": 4103 }, { "epoch": 0.11, "learning_rate": 1.9648841325175792e-05, "loss": 1.3193, "step": 4104 }, { "epoch": 0.11, "learning_rate": 1.9648608948738384e-05, "loss": 1.3521, "step": 4105 }, { "epoch": 0.11, "learning_rate": 1.9648376496814803e-05, "loss": 1.5342, "step": 4106 }, { "epoch": 0.11, "learning_rate": 1.9648143969406857e-05, "loss": 1.5312, "step": 4107 }, { "epoch": 0.11, "learning_rate": 1.964791136651637e-05, "loss": 1.5068, "step": 4108 }, { "epoch": 0.11, "learning_rate": 1.9647678688145163e-05, "loss": 1.3491, "step": 4109 }, { "epoch": 0.11, "learning_rate": 1.964744593429505e-05, "loss": 1.3179, "step": 4110 }, { "epoch": 0.11, "learning_rate": 1.9647213104967863e-05, "loss": 1.532, "step": 4111 }, { "epoch": 0.11, "learning_rate": 1.964698020016541e-05, "loss": 1.2417, "step": 4112 }, { "epoch": 0.11, "learning_rate": 1.9646747219889524e-05, "loss": 1.6167, "step": 4113 }, { "epoch": 0.11, "learning_rate": 1.9646514164142023e-05, "loss": 1.4734, "step": 4114 }, { "epoch": 0.11, "learning_rate": 1.9646281032924733e-05, "loss": 1.5498, "step": 4115 }, { "epoch": 0.11, "learning_rate": 1.9646047826239477e-05, "loss": 1.5386, "step": 4116 }, { "epoch": 0.11, "learning_rate": 1.9645814544088076e-05, "loss": 1.5044, "step": 4117 }, { "epoch": 0.11, "learning_rate": 1.964558118647236e-05, "loss": 1.5002, "step": 4118 }, { "epoch": 0.11, "learning_rate": 1.964534775339415e-05, "loss": 1.1912, "step": 4119 }, { "epoch": 0.11, "learning_rate": 1.9645114244855278e-05, "loss": 1.3037, "step": 4120 }, { "epoch": 0.11, "learning_rate": 1.9644880660857563e-05, "loss": 1.3472, "step": 4121 }, { "epoch": 0.11, "learning_rate": 1.9644647001402843e-05, "loss": 1.4009, "step": 4122 }, { "epoch": 0.11, "learning_rate": 1.9644413266492933e-05, "loss": 1.4143, "step": 4123 }, { "epoch": 0.11, "learning_rate": 1.964417945612967e-05, "loss": 1.564, "step": 4124 }, { "epoch": 0.11, "learning_rate": 1.9643945570314886e-05, "loss": 1.4556, "step": 4125 }, { "epoch": 0.11, "learning_rate": 1.9643711609050407e-05, "loss": 1.4819, "step": 4126 }, { "epoch": 0.11, "learning_rate": 1.964347757233806e-05, "loss": 1.4495, "step": 4127 }, { "epoch": 0.11, "learning_rate": 1.964324346017968e-05, "loss": 1.2412, "step": 4128 }, { "epoch": 0.11, "learning_rate": 1.96430092725771e-05, "loss": 1.4995, "step": 4129 }, { "epoch": 0.11, "learning_rate": 1.9642775009532146e-05, "loss": 1.5073, "step": 4130 }, { "epoch": 0.11, "learning_rate": 1.964254067104666e-05, "loss": 1.4014, "step": 4131 }, { "epoch": 0.11, "learning_rate": 1.9642306257122465e-05, "loss": 1.4739, "step": 4132 }, { "epoch": 0.11, "learning_rate": 1.96420717677614e-05, "loss": 1.2573, "step": 4133 }, { "epoch": 0.11, "learning_rate": 1.9641837202965303e-05, "loss": 1.4336, "step": 4134 }, { "epoch": 0.11, "learning_rate": 1.9641602562736005e-05, "loss": 1.4956, "step": 4135 }, { "epoch": 0.11, "learning_rate": 1.964136784707534e-05, "loss": 1.3977, "step": 4136 }, { "epoch": 0.11, "learning_rate": 1.964113305598515e-05, "loss": 1.2112, "step": 4137 }, { "epoch": 0.11, "learning_rate": 1.9640898189467265e-05, "loss": 1.4148, "step": 4138 }, { "epoch": 0.11, "learning_rate": 1.9640663247523527e-05, "loss": 1.5735, "step": 4139 }, { "epoch": 0.11, "learning_rate": 1.9640428230155775e-05, "loss": 1.3801, "step": 4140 }, { "epoch": 0.11, "learning_rate": 1.9640193137365843e-05, "loss": 1.4365, "step": 4141 }, { "epoch": 0.11, "learning_rate": 1.9639957969155573e-05, "loss": 1.4395, "step": 4142 }, { "epoch": 0.11, "learning_rate": 1.9639722725526807e-05, "loss": 1.5005, "step": 4143 }, { "epoch": 0.11, "learning_rate": 1.9639487406481382e-05, "loss": 1.4451, "step": 4144 }, { "epoch": 0.11, "learning_rate": 1.9639252012021145e-05, "loss": 1.9512, "step": 4145 }, { "epoch": 0.11, "learning_rate": 1.9639016542147927e-05, "loss": 1.5107, "step": 4146 }, { "epoch": 0.11, "learning_rate": 1.9638780996863576e-05, "loss": 1.5669, "step": 4147 }, { "epoch": 0.11, "learning_rate": 1.963854537616994e-05, "loss": 1.4209, "step": 4148 }, { "epoch": 0.11, "learning_rate": 1.963830968006885e-05, "loss": 1.5156, "step": 4149 }, { "epoch": 0.11, "learning_rate": 1.9638073908562166e-05, "loss": 1.2583, "step": 4150 }, { "epoch": 0.11, "learning_rate": 1.963783806165172e-05, "loss": 1.4231, "step": 4151 }, { "epoch": 0.11, "learning_rate": 1.9637602139339358e-05, "loss": 1.4465, "step": 4152 }, { "epoch": 0.11, "learning_rate": 1.963736614162693e-05, "loss": 1.3457, "step": 4153 }, { "epoch": 0.11, "learning_rate": 1.9637130068516286e-05, "loss": 1.8164, "step": 4154 }, { "epoch": 0.11, "learning_rate": 1.9636893920009263e-05, "loss": 1.325, "step": 4155 }, { "epoch": 0.11, "learning_rate": 1.9636657696107716e-05, "loss": 1.3901, "step": 4156 }, { "epoch": 0.11, "learning_rate": 1.963642139681349e-05, "loss": 1.3865, "step": 4157 }, { "epoch": 0.11, "learning_rate": 1.9636185022128433e-05, "loss": 1.5525, "step": 4158 }, { "epoch": 0.11, "learning_rate": 1.9635948572054398e-05, "loss": 1.5178, "step": 4159 }, { "epoch": 0.11, "learning_rate": 1.9635712046593228e-05, "loss": 1.4578, "step": 4160 }, { "epoch": 0.11, "learning_rate": 1.9635475445746786e-05, "loss": 1.4741, "step": 4161 }, { "epoch": 0.11, "learning_rate": 1.963523876951691e-05, "loss": 1.5205, "step": 4162 }, { "epoch": 0.11, "learning_rate": 1.9635002017905456e-05, "loss": 1.4741, "step": 4163 }, { "epoch": 0.11, "learning_rate": 1.963476519091428e-05, "loss": 1.4397, "step": 4164 }, { "epoch": 0.11, "learning_rate": 1.9634528288545226e-05, "loss": 1.5332, "step": 4165 }, { "epoch": 0.11, "learning_rate": 1.9634291310800158e-05, "loss": 1.2993, "step": 4166 }, { "epoch": 0.11, "learning_rate": 1.9634054257680924e-05, "loss": 1.4272, "step": 4167 }, { "epoch": 0.11, "learning_rate": 1.963381712918938e-05, "loss": 1.4062, "step": 4168 }, { "epoch": 0.11, "learning_rate": 1.963357992532738e-05, "loss": 1.4268, "step": 4169 }, { "epoch": 0.11, "learning_rate": 1.963334264609678e-05, "loss": 1.335, "step": 4170 }, { "epoch": 0.11, "learning_rate": 1.963310529149944e-05, "loss": 1.3867, "step": 4171 }, { "epoch": 0.11, "learning_rate": 1.963286786153721e-05, "loss": 1.2585, "step": 4172 }, { "epoch": 0.11, "learning_rate": 1.9632630356211955e-05, "loss": 1.4629, "step": 4173 }, { "epoch": 0.11, "learning_rate": 1.9632392775525528e-05, "loss": 1.4856, "step": 4174 }, { "epoch": 0.11, "learning_rate": 1.9632155119479793e-05, "loss": 1.4072, "step": 4175 }, { "epoch": 0.11, "learning_rate": 1.96319173880766e-05, "loss": 1.3494, "step": 4176 }, { "epoch": 0.11, "learning_rate": 1.9631679581317817e-05, "loss": 1.3943, "step": 4177 }, { "epoch": 0.11, "learning_rate": 1.9631441699205303e-05, "loss": 1.3071, "step": 4178 }, { "epoch": 0.11, "learning_rate": 1.963120374174092e-05, "loss": 1.4736, "step": 4179 }, { "epoch": 0.11, "learning_rate": 1.9630965708926522e-05, "loss": 1.416, "step": 4180 }, { "epoch": 0.11, "learning_rate": 1.9630727600763978e-05, "loss": 1.5283, "step": 4181 }, { "epoch": 0.11, "learning_rate": 1.9630489417255156e-05, "loss": 1.5706, "step": 4182 }, { "epoch": 0.11, "learning_rate": 1.963025115840191e-05, "loss": 1.4304, "step": 4183 }, { "epoch": 0.11, "learning_rate": 1.9630012824206107e-05, "loss": 1.5459, "step": 4184 }, { "epoch": 0.11, "learning_rate": 1.9629774414669613e-05, "loss": 1.2769, "step": 4185 }, { "epoch": 0.11, "learning_rate": 1.962953592979429e-05, "loss": 1.325, "step": 4186 }, { "epoch": 0.11, "learning_rate": 1.9629297369582007e-05, "loss": 1.4524, "step": 4187 }, { "epoch": 0.11, "learning_rate": 1.962905873403463e-05, "loss": 1.4795, "step": 4188 }, { "epoch": 0.11, "learning_rate": 1.9628820023154024e-05, "loss": 1.4131, "step": 4189 }, { "epoch": 0.11, "learning_rate": 1.962858123694206e-05, "loss": 1.4487, "step": 4190 }, { "epoch": 0.11, "learning_rate": 1.9628342375400602e-05, "loss": 1.439, "step": 4191 }, { "epoch": 0.11, "learning_rate": 1.9628103438531523e-05, "loss": 1.5093, "step": 4192 }, { "epoch": 0.11, "learning_rate": 1.962786442633669e-05, "loss": 1.7231, "step": 4193 }, { "epoch": 0.11, "learning_rate": 1.962762533881797e-05, "loss": 1.4263, "step": 4194 }, { "epoch": 0.11, "learning_rate": 1.962738617597724e-05, "loss": 1.5908, "step": 4195 }, { "epoch": 0.11, "learning_rate": 1.9627146937816366e-05, "loss": 1.387, "step": 4196 }, { "epoch": 0.11, "learning_rate": 1.962690762433722e-05, "loss": 1.3616, "step": 4197 }, { "epoch": 0.11, "learning_rate": 1.962666823554168e-05, "loss": 1.4766, "step": 4198 }, { "epoch": 0.11, "learning_rate": 1.962642877143161e-05, "loss": 1.4226, "step": 4199 }, { "epoch": 0.11, "learning_rate": 1.9626189232008892e-05, "loss": 1.4692, "step": 4200 }, { "epoch": 0.11, "learning_rate": 1.962594961727539e-05, "loss": 1.3767, "step": 4201 }, { "epoch": 0.11, "learning_rate": 1.9625709927232993e-05, "loss": 1.4666, "step": 4202 }, { "epoch": 0.11, "learning_rate": 1.9625470161883563e-05, "loss": 1.314, "step": 4203 }, { "epoch": 0.11, "learning_rate": 1.962523032122898e-05, "loss": 1.5391, "step": 4204 }, { "epoch": 0.11, "learning_rate": 1.962499040527112e-05, "loss": 1.3472, "step": 4205 }, { "epoch": 0.11, "learning_rate": 1.9624750414011865e-05, "loss": 1.3408, "step": 4206 }, { "epoch": 0.11, "learning_rate": 1.9624510347453087e-05, "loss": 1.3691, "step": 4207 }, { "epoch": 0.11, "learning_rate": 1.9624270205596664e-05, "loss": 1.3633, "step": 4208 }, { "epoch": 0.11, "learning_rate": 1.962402998844448e-05, "loss": 1.3989, "step": 4209 }, { "epoch": 0.11, "learning_rate": 1.9623789695998408e-05, "loss": 1.406, "step": 4210 }, { "epoch": 0.11, "learning_rate": 1.962354932826033e-05, "loss": 1.4944, "step": 4211 }, { "epoch": 0.12, "learning_rate": 1.962330888523213e-05, "loss": 1.3367, "step": 4212 }, { "epoch": 0.12, "learning_rate": 1.9623068366915687e-05, "loss": 1.3948, "step": 4213 }, { "epoch": 0.12, "learning_rate": 1.962282777331288e-05, "loss": 1.4048, "step": 4214 }, { "epoch": 0.12, "learning_rate": 1.9622587104425595e-05, "loss": 1.3745, "step": 4215 }, { "epoch": 0.12, "learning_rate": 1.9622346360255712e-05, "loss": 1.9043, "step": 4216 }, { "epoch": 0.12, "learning_rate": 1.9622105540805116e-05, "loss": 1.3555, "step": 4217 }, { "epoch": 0.12, "learning_rate": 1.9621864646075696e-05, "loss": 1.6001, "step": 4218 }, { "epoch": 0.12, "learning_rate": 1.9621623676069323e-05, "loss": 1.4116, "step": 4219 }, { "epoch": 0.12, "learning_rate": 1.9621382630787895e-05, "loss": 1.4211, "step": 4220 }, { "epoch": 0.12, "learning_rate": 1.9621141510233294e-05, "loss": 1.75, "step": 4221 }, { "epoch": 0.12, "learning_rate": 1.9620900314407406e-05, "loss": 1.3235, "step": 4222 }, { "epoch": 0.12, "learning_rate": 1.962065904331212e-05, "loss": 1.2517, "step": 4223 }, { "epoch": 0.12, "learning_rate": 1.9620417696949316e-05, "loss": 1.4688, "step": 4224 }, { "epoch": 0.12, "learning_rate": 1.962017627532089e-05, "loss": 1.3267, "step": 4225 }, { "epoch": 0.12, "learning_rate": 1.961993477842873e-05, "loss": 1.4368, "step": 4226 }, { "epoch": 0.12, "learning_rate": 1.9619693206274724e-05, "loss": 1.511, "step": 4227 }, { "epoch": 0.12, "learning_rate": 1.961945155886076e-05, "loss": 1.408, "step": 4228 }, { "epoch": 0.12, "learning_rate": 1.961920983618873e-05, "loss": 1.4487, "step": 4229 }, { "epoch": 0.12, "learning_rate": 1.9618968038260528e-05, "loss": 1.521, "step": 4230 }, { "epoch": 0.12, "learning_rate": 1.961872616507804e-05, "loss": 1.2815, "step": 4231 }, { "epoch": 0.12, "learning_rate": 1.961848421664317e-05, "loss": 1.4492, "step": 4232 }, { "epoch": 0.12, "learning_rate": 1.961824219295779e-05, "loss": 1.5977, "step": 4233 }, { "epoch": 0.12, "learning_rate": 1.9618000094023816e-05, "loss": 1.5381, "step": 4234 }, { "epoch": 0.12, "learning_rate": 1.9617757919843126e-05, "loss": 1.4353, "step": 4235 }, { "epoch": 0.12, "learning_rate": 1.961751567041762e-05, "loss": 1.2742, "step": 4236 }, { "epoch": 0.12, "learning_rate": 1.96172733457492e-05, "loss": 1.5698, "step": 4237 }, { "epoch": 0.12, "learning_rate": 1.961703094583975e-05, "loss": 1.3657, "step": 4238 }, { "epoch": 0.12, "learning_rate": 1.9616788470691176e-05, "loss": 1.4326, "step": 4239 }, { "epoch": 0.12, "learning_rate": 1.961654592030537e-05, "loss": 1.3713, "step": 4240 }, { "epoch": 0.12, "learning_rate": 1.9616303294684228e-05, "loss": 1.4004, "step": 4241 }, { "epoch": 0.12, "learning_rate": 1.9616060593829657e-05, "loss": 1.5869, "step": 4242 }, { "epoch": 0.12, "learning_rate": 1.9615817817743543e-05, "loss": 1.4912, "step": 4243 }, { "epoch": 0.12, "learning_rate": 1.9615574966427796e-05, "loss": 1.3547, "step": 4244 }, { "epoch": 0.12, "learning_rate": 1.961533203988431e-05, "loss": 1.4678, "step": 4245 }, { "epoch": 0.12, "learning_rate": 1.961508903811499e-05, "loss": 1.4805, "step": 4246 }, { "epoch": 0.12, "learning_rate": 1.961484596112173e-05, "loss": 1.3584, "step": 4247 }, { "epoch": 0.12, "learning_rate": 1.961460280890644e-05, "loss": 1.5288, "step": 4248 }, { "epoch": 0.12, "learning_rate": 1.961435958147102e-05, "loss": 1.4336, "step": 4249 }, { "epoch": 0.12, "learning_rate": 1.961411627881737e-05, "loss": 1.3789, "step": 4250 }, { "epoch": 0.12, "learning_rate": 1.9613872900947396e-05, "loss": 1.521, "step": 4251 }, { "epoch": 0.12, "learning_rate": 1.9613629447863e-05, "loss": 1.8516, "step": 4252 }, { "epoch": 0.12, "learning_rate": 1.961338591956609e-05, "loss": 1.8335, "step": 4253 }, { "epoch": 0.12, "learning_rate": 1.9613142316058566e-05, "loss": 1.4458, "step": 4254 }, { "epoch": 0.12, "learning_rate": 1.9612898637342336e-05, "loss": 1.4717, "step": 4255 }, { "epoch": 0.12, "learning_rate": 1.961265488341931e-05, "loss": 1.5215, "step": 4256 }, { "epoch": 0.12, "learning_rate": 1.9612411054291392e-05, "loss": 1.4314, "step": 4257 }, { "epoch": 0.12, "learning_rate": 1.961216714996049e-05, "loss": 1.386, "step": 4258 }, { "epoch": 0.12, "learning_rate": 1.961192317042851e-05, "loss": 1.3838, "step": 4259 }, { "epoch": 0.12, "learning_rate": 1.9611679115697365e-05, "loss": 1.3075, "step": 4260 }, { "epoch": 0.12, "learning_rate": 1.961143498576896e-05, "loss": 1.3667, "step": 4261 }, { "epoch": 0.12, "learning_rate": 1.9611190780645214e-05, "loss": 1.4429, "step": 4262 }, { "epoch": 0.12, "learning_rate": 1.9610946500328025e-05, "loss": 1.3647, "step": 4263 }, { "epoch": 0.12, "learning_rate": 1.961070214481931e-05, "loss": 1.4399, "step": 4264 }, { "epoch": 0.12, "learning_rate": 1.9610457714120983e-05, "loss": 1.4937, "step": 4265 }, { "epoch": 0.12, "learning_rate": 1.9610213208234955e-05, "loss": 1.3235, "step": 4266 }, { "epoch": 0.12, "learning_rate": 1.9609968627163133e-05, "loss": 1.3542, "step": 4267 }, { "epoch": 0.12, "learning_rate": 1.960972397090744e-05, "loss": 1.5591, "step": 4268 }, { "epoch": 0.12, "learning_rate": 1.9609479239469785e-05, "loss": 1.4434, "step": 4269 }, { "epoch": 0.12, "learning_rate": 1.960923443285208e-05, "loss": 1.5054, "step": 4270 }, { "epoch": 0.12, "learning_rate": 1.9608989551056245e-05, "loss": 1.5037, "step": 4271 }, { "epoch": 0.12, "learning_rate": 1.9608744594084194e-05, "loss": 1.4709, "step": 4272 }, { "epoch": 0.12, "learning_rate": 1.9608499561937847e-05, "loss": 1.3171, "step": 4273 }, { "epoch": 0.12, "learning_rate": 1.9608254454619114e-05, "loss": 1.3511, "step": 4274 }, { "epoch": 0.12, "learning_rate": 1.9608009272129918e-05, "loss": 1.5117, "step": 4275 }, { "epoch": 0.12, "learning_rate": 1.9607764014472175e-05, "loss": 1.3823, "step": 4276 }, { "epoch": 0.12, "learning_rate": 1.9607518681647803e-05, "loss": 1.584, "step": 4277 }, { "epoch": 0.12, "learning_rate": 1.960727327365872e-05, "loss": 1.4397, "step": 4278 }, { "epoch": 0.12, "learning_rate": 1.9607027790506855e-05, "loss": 1.5095, "step": 4279 }, { "epoch": 0.12, "learning_rate": 1.9606782232194117e-05, "loss": 1.5247, "step": 4280 }, { "epoch": 0.12, "learning_rate": 1.9606536598722435e-05, "loss": 1.4614, "step": 4281 }, { "epoch": 0.12, "learning_rate": 1.960629089009373e-05, "loss": 1.3796, "step": 4282 }, { "epoch": 0.12, "learning_rate": 1.9606045106309917e-05, "loss": 1.5161, "step": 4283 }, { "epoch": 0.12, "learning_rate": 1.9605799247372928e-05, "loss": 1.4316, "step": 4284 }, { "epoch": 0.12, "learning_rate": 1.9605553313284682e-05, "loss": 1.5283, "step": 4285 }, { "epoch": 0.12, "learning_rate": 1.96053073040471e-05, "loss": 1.4688, "step": 4286 }, { "epoch": 0.12, "learning_rate": 1.9605061219662114e-05, "loss": 1.3125, "step": 4287 }, { "epoch": 0.12, "learning_rate": 1.9604815060131645e-05, "loss": 1.415, "step": 4288 }, { "epoch": 0.12, "learning_rate": 1.9604568825457623e-05, "loss": 1.3809, "step": 4289 }, { "epoch": 0.12, "learning_rate": 1.9604322515641964e-05, "loss": 1.4604, "step": 4290 }, { "epoch": 0.12, "learning_rate": 1.9604076130686608e-05, "loss": 1.5435, "step": 4291 }, { "epoch": 0.12, "learning_rate": 1.9603829670593473e-05, "loss": 1.4761, "step": 4292 }, { "epoch": 0.12, "learning_rate": 1.960358313536449e-05, "loss": 1.5942, "step": 4293 }, { "epoch": 0.12, "learning_rate": 1.9603336525001593e-05, "loss": 1.5718, "step": 4294 }, { "epoch": 0.12, "learning_rate": 1.9603089839506702e-05, "loss": 1.5439, "step": 4295 }, { "epoch": 0.12, "learning_rate": 1.960284307888175e-05, "loss": 1.2983, "step": 4296 }, { "epoch": 0.12, "learning_rate": 1.9602596243128675e-05, "loss": 1.3354, "step": 4297 }, { "epoch": 0.12, "learning_rate": 1.9602349332249403e-05, "loss": 1.4678, "step": 4298 }, { "epoch": 0.12, "learning_rate": 1.960210234624586e-05, "loss": 1.4712, "step": 4299 }, { "epoch": 0.12, "learning_rate": 1.9601855285119987e-05, "loss": 1.4478, "step": 4300 }, { "epoch": 0.12, "learning_rate": 1.9601608148873712e-05, "loss": 1.4751, "step": 4301 }, { "epoch": 0.12, "learning_rate": 1.9601360937508974e-05, "loss": 1.4731, "step": 4302 }, { "epoch": 0.12, "learning_rate": 1.9601113651027697e-05, "loss": 1.6118, "step": 4303 }, { "epoch": 0.12, "learning_rate": 1.9600866289431823e-05, "loss": 1.4243, "step": 4304 }, { "epoch": 0.12, "learning_rate": 1.9600618852723287e-05, "loss": 1.3318, "step": 4305 }, { "epoch": 0.12, "learning_rate": 1.9600371340904022e-05, "loss": 1.5776, "step": 4306 }, { "epoch": 0.12, "learning_rate": 1.9600123753975968e-05, "loss": 1.481, "step": 4307 }, { "epoch": 0.12, "learning_rate": 1.959987609194106e-05, "loss": 1.4795, "step": 4308 }, { "epoch": 0.12, "learning_rate": 1.9599628354801235e-05, "loss": 1.0126, "step": 4309 }, { "epoch": 0.12, "learning_rate": 1.9599380542558433e-05, "loss": 1.333, "step": 4310 }, { "epoch": 0.12, "learning_rate": 1.959913265521459e-05, "loss": 1.3618, "step": 4311 }, { "epoch": 0.12, "learning_rate": 1.959888469277165e-05, "loss": 1.5083, "step": 4312 }, { "epoch": 0.12, "learning_rate": 1.9598636655231543e-05, "loss": 1.2612, "step": 4313 }, { "epoch": 0.12, "learning_rate": 1.959838854259622e-05, "loss": 1.6406, "step": 4314 }, { "epoch": 0.12, "learning_rate": 1.959814035486762e-05, "loss": 1.4824, "step": 4315 }, { "epoch": 0.12, "learning_rate": 1.9597892092047683e-05, "loss": 1.4026, "step": 4316 }, { "epoch": 0.12, "learning_rate": 1.959764375413835e-05, "loss": 1.3491, "step": 4317 }, { "epoch": 0.12, "learning_rate": 1.9597395341141567e-05, "loss": 1.48, "step": 4318 }, { "epoch": 0.12, "learning_rate": 1.9597146853059273e-05, "loss": 1.4314, "step": 4319 }, { "epoch": 0.12, "learning_rate": 1.9596898289893418e-05, "loss": 1.4417, "step": 4320 }, { "epoch": 0.12, "learning_rate": 1.9596649651645942e-05, "loss": 1.4478, "step": 4321 }, { "epoch": 0.12, "learning_rate": 1.959640093831879e-05, "loss": 1.3352, "step": 4322 }, { "epoch": 0.12, "learning_rate": 1.9596152149913914e-05, "loss": 1.4512, "step": 4323 }, { "epoch": 0.12, "learning_rate": 1.9595903286433256e-05, "loss": 1.3862, "step": 4324 }, { "epoch": 0.12, "learning_rate": 1.959565434787876e-05, "loss": 1.5024, "step": 4325 }, { "epoch": 0.12, "learning_rate": 1.9595405334252377e-05, "loss": 1.4395, "step": 4326 }, { "epoch": 0.12, "learning_rate": 1.9595156245556056e-05, "loss": 1.4702, "step": 4327 }, { "epoch": 0.12, "learning_rate": 1.9594907081791745e-05, "loss": 1.4995, "step": 4328 }, { "epoch": 0.12, "learning_rate": 1.9594657842961388e-05, "loss": 1.49, "step": 4329 }, { "epoch": 0.12, "learning_rate": 1.9594408529066945e-05, "loss": 1.3687, "step": 4330 }, { "epoch": 0.12, "learning_rate": 1.9594159140110356e-05, "loss": 1.5205, "step": 4331 }, { "epoch": 0.12, "learning_rate": 1.9593909676093584e-05, "loss": 1.3481, "step": 4332 }, { "epoch": 0.12, "learning_rate": 1.959366013701857e-05, "loss": 1.5791, "step": 4333 }, { "epoch": 0.12, "learning_rate": 1.9593410522887274e-05, "loss": 1.834, "step": 4334 }, { "epoch": 0.12, "learning_rate": 1.9593160833701643e-05, "loss": 1.3672, "step": 4335 }, { "epoch": 0.12, "learning_rate": 1.959291106946363e-05, "loss": 1.4797, "step": 4336 }, { "epoch": 0.12, "learning_rate": 1.9592661230175192e-05, "loss": 1.5859, "step": 4337 }, { "epoch": 0.12, "learning_rate": 1.959241131583829e-05, "loss": 1.4971, "step": 4338 }, { "epoch": 0.12, "learning_rate": 1.9592161326454865e-05, "loss": 1.4631, "step": 4339 }, { "epoch": 0.12, "learning_rate": 1.9591911262026882e-05, "loss": 1.4709, "step": 4340 }, { "epoch": 0.12, "learning_rate": 1.9591661122556297e-05, "loss": 1.3425, "step": 4341 }, { "epoch": 0.12, "learning_rate": 1.9591410908045067e-05, "loss": 1.5337, "step": 4342 }, { "epoch": 0.12, "learning_rate": 1.9591160618495147e-05, "loss": 1.5156, "step": 4343 }, { "epoch": 0.12, "learning_rate": 1.9590910253908493e-05, "loss": 1.6345, "step": 4344 }, { "epoch": 0.12, "learning_rate": 1.9590659814287073e-05, "loss": 1.4099, "step": 4345 }, { "epoch": 0.12, "learning_rate": 1.959040929963284e-05, "loss": 1.3958, "step": 4346 }, { "epoch": 0.12, "learning_rate": 1.9590158709947752e-05, "loss": 1.5239, "step": 4347 }, { "epoch": 0.12, "learning_rate": 1.958990804523377e-05, "loss": 1.4521, "step": 4348 }, { "epoch": 0.12, "learning_rate": 1.9589657305492857e-05, "loss": 1.4707, "step": 4349 }, { "epoch": 0.12, "learning_rate": 1.958940649072698e-05, "loss": 1.5303, "step": 4350 }, { "epoch": 0.12, "learning_rate": 1.958915560093809e-05, "loss": 1.4448, "step": 4351 }, { "epoch": 0.12, "learning_rate": 1.958890463612816e-05, "loss": 1.5562, "step": 4352 }, { "epoch": 0.12, "learning_rate": 1.958865359629915e-05, "loss": 1.5227, "step": 4353 }, { "epoch": 0.12, "learning_rate": 1.9588402481453018e-05, "loss": 1.4744, "step": 4354 }, { "epoch": 0.12, "learning_rate": 1.9588151291591735e-05, "loss": 1.4141, "step": 4355 }, { "epoch": 0.12, "learning_rate": 1.9587900026717265e-05, "loss": 1.4575, "step": 4356 }, { "epoch": 0.12, "learning_rate": 1.9587648686831576e-05, "loss": 1.4563, "step": 4357 }, { "epoch": 0.12, "learning_rate": 1.958739727193663e-05, "loss": 1.4492, "step": 4358 }, { "epoch": 0.12, "learning_rate": 1.95871457820344e-05, "loss": 1.3892, "step": 4359 }, { "epoch": 0.12, "learning_rate": 1.9586894217126848e-05, "loss": 1.5464, "step": 4360 }, { "epoch": 0.12, "learning_rate": 1.958664257721594e-05, "loss": 1.4822, "step": 4361 }, { "epoch": 0.12, "learning_rate": 1.958639086230365e-05, "loss": 1.2449, "step": 4362 }, { "epoch": 0.12, "learning_rate": 1.9586139072391947e-05, "loss": 1.4141, "step": 4363 }, { "epoch": 0.12, "learning_rate": 1.95858872074828e-05, "loss": 1.4097, "step": 4364 }, { "epoch": 0.12, "learning_rate": 1.958563526757818e-05, "loss": 1.5132, "step": 4365 }, { "epoch": 0.12, "learning_rate": 1.9585383252680053e-05, "loss": 1.5251, "step": 4366 }, { "epoch": 0.12, "learning_rate": 1.95851311627904e-05, "loss": 1.3259, "step": 4367 }, { "epoch": 0.12, "learning_rate": 1.958487899791118e-05, "loss": 1.5469, "step": 4368 }, { "epoch": 0.12, "learning_rate": 1.9584626758044384e-05, "loss": 1.5171, "step": 4369 }, { "epoch": 0.12, "learning_rate": 1.9584374443191965e-05, "loss": 1.4929, "step": 4370 }, { "epoch": 0.12, "learning_rate": 1.9584122053355914e-05, "loss": 1.458, "step": 4371 }, { "epoch": 0.12, "learning_rate": 1.95838695885382e-05, "loss": 1.4229, "step": 4372 }, { "epoch": 0.12, "learning_rate": 1.9583617048740793e-05, "loss": 1.4436, "step": 4373 }, { "epoch": 0.12, "learning_rate": 1.9583364433965676e-05, "loss": 1.4907, "step": 4374 }, { "epoch": 0.12, "learning_rate": 1.958311174421482e-05, "loss": 1.384, "step": 4375 }, { "epoch": 0.12, "learning_rate": 1.95828589794902e-05, "loss": 1.3806, "step": 4376 }, { "epoch": 0.12, "learning_rate": 1.9582606139793804e-05, "loss": 1.5337, "step": 4377 }, { "epoch": 0.12, "learning_rate": 1.9582353225127604e-05, "loss": 1.4607, "step": 4378 }, { "epoch": 0.12, "learning_rate": 1.9582100235493574e-05, "loss": 1.4358, "step": 4379 }, { "epoch": 0.12, "learning_rate": 1.95818471708937e-05, "loss": 1.4507, "step": 4380 }, { "epoch": 0.12, "learning_rate": 1.958159403132996e-05, "loss": 1.5225, "step": 4381 }, { "epoch": 0.12, "learning_rate": 1.958134081680433e-05, "loss": 1.46, "step": 4382 }, { "epoch": 0.12, "learning_rate": 1.95810875273188e-05, "loss": 1.3748, "step": 4383 }, { "epoch": 0.12, "learning_rate": 1.9580834162875342e-05, "loss": 1.292, "step": 4384 }, { "epoch": 0.12, "learning_rate": 1.9580580723475945e-05, "loss": 1.1804, "step": 4385 }, { "epoch": 0.12, "learning_rate": 1.958032720912259e-05, "loss": 1.3545, "step": 4386 }, { "epoch": 0.12, "learning_rate": 1.958007361981726e-05, "loss": 1.3889, "step": 4387 }, { "epoch": 0.12, "learning_rate": 1.9579819955561938e-05, "loss": 1.458, "step": 4388 }, { "epoch": 0.12, "learning_rate": 1.957956621635861e-05, "loss": 1.3698, "step": 4389 }, { "epoch": 0.12, "learning_rate": 1.957931240220926e-05, "loss": 1.2856, "step": 4390 }, { "epoch": 0.12, "learning_rate": 1.9579058513115875e-05, "loss": 1.4556, "step": 4391 }, { "epoch": 0.12, "learning_rate": 1.957880454908044e-05, "loss": 1.3945, "step": 4392 }, { "epoch": 0.12, "learning_rate": 1.957855051010494e-05, "loss": 1.5425, "step": 4393 }, { "epoch": 0.12, "learning_rate": 1.9578296396191368e-05, "loss": 1.4053, "step": 4394 }, { "epoch": 0.12, "learning_rate": 1.9578042207341708e-05, "loss": 1.5229, "step": 4395 }, { "epoch": 0.12, "learning_rate": 1.9577787943557947e-05, "loss": 1.5522, "step": 4396 }, { "epoch": 0.12, "learning_rate": 1.9577533604842084e-05, "loss": 1.9219, "step": 4397 }, { "epoch": 0.12, "learning_rate": 1.9577279191196098e-05, "loss": 1.3071, "step": 4398 }, { "epoch": 0.12, "learning_rate": 1.957702470262198e-05, "loss": 1.2568, "step": 4399 }, { "epoch": 0.12, "learning_rate": 1.957677013912173e-05, "loss": 1.4971, "step": 4400 }, { "epoch": 0.12, "learning_rate": 1.957651550069733e-05, "loss": 1.3208, "step": 4401 }, { "epoch": 0.12, "learning_rate": 1.9576260787350777e-05, "loss": 1.4089, "step": 4402 }, { "epoch": 0.12, "learning_rate": 1.957600599908406e-05, "loss": 1.5156, "step": 4403 }, { "epoch": 0.12, "learning_rate": 1.9575751135899178e-05, "loss": 1.3707, "step": 4404 }, { "epoch": 0.12, "learning_rate": 1.9575496197798122e-05, "loss": 1.2954, "step": 4405 }, { "epoch": 0.12, "learning_rate": 1.9575241184782884e-05, "loss": 1.8569, "step": 4406 }, { "epoch": 0.12, "learning_rate": 1.9574986096855463e-05, "loss": 1.4148, "step": 4407 }, { "epoch": 0.12, "learning_rate": 1.9574730934017857e-05, "loss": 1.3987, "step": 4408 }, { "epoch": 0.12, "learning_rate": 1.9574475696272052e-05, "loss": 1.3572, "step": 4409 }, { "epoch": 0.12, "learning_rate": 1.9574220383620054e-05, "loss": 1.4578, "step": 4410 }, { "epoch": 0.12, "learning_rate": 1.9573964996063862e-05, "loss": 1.3999, "step": 4411 }, { "epoch": 0.12, "learning_rate": 1.9573709533605464e-05, "loss": 1.3428, "step": 4412 }, { "epoch": 0.12, "learning_rate": 1.9573453996246867e-05, "loss": 1.2964, "step": 4413 }, { "epoch": 0.12, "learning_rate": 1.957319838399007e-05, "loss": 1.5771, "step": 4414 }, { "epoch": 0.12, "learning_rate": 1.9572942696837067e-05, "loss": 1.5356, "step": 4415 }, { "epoch": 0.12, "learning_rate": 1.957268693478986e-05, "loss": 1.4727, "step": 4416 }, { "epoch": 0.12, "learning_rate": 1.9572431097850456e-05, "loss": 1.4663, "step": 4417 }, { "epoch": 0.12, "learning_rate": 1.957217518602085e-05, "loss": 1.426, "step": 4418 }, { "epoch": 0.12, "learning_rate": 1.9571919199303048e-05, "loss": 1.4001, "step": 4419 }, { "epoch": 0.12, "learning_rate": 1.9571663137699053e-05, "loss": 1.4458, "step": 4420 }, { "epoch": 0.12, "learning_rate": 1.9571407001210864e-05, "loss": 1.6626, "step": 4421 }, { "epoch": 0.12, "learning_rate": 1.9571150789840486e-05, "loss": 1.4807, "step": 4422 }, { "epoch": 0.12, "learning_rate": 1.9570894503589926e-05, "loss": 1.4087, "step": 4423 }, { "epoch": 0.12, "learning_rate": 1.957063814246119e-05, "loss": 1.6206, "step": 4424 }, { "epoch": 0.12, "learning_rate": 1.957038170645628e-05, "loss": 1.4741, "step": 4425 }, { "epoch": 0.12, "learning_rate": 1.9570125195577203e-05, "loss": 1.2686, "step": 4426 }, { "epoch": 0.12, "learning_rate": 1.9569868609825968e-05, "loss": 1.4961, "step": 4427 }, { "epoch": 0.12, "learning_rate": 1.956961194920458e-05, "loss": 1.3392, "step": 4428 }, { "epoch": 0.12, "learning_rate": 1.956935521371505e-05, "loss": 1.8208, "step": 4429 }, { "epoch": 0.12, "learning_rate": 1.9569098403359383e-05, "loss": 1.4717, "step": 4430 }, { "epoch": 0.12, "learning_rate": 1.9568841518139588e-05, "loss": 1.3174, "step": 4431 }, { "epoch": 0.12, "learning_rate": 1.956858455805768e-05, "loss": 1.353, "step": 4432 }, { "epoch": 0.12, "learning_rate": 1.9568327523115664e-05, "loss": 1.3398, "step": 4433 }, { "epoch": 0.12, "learning_rate": 1.9568070413315555e-05, "loss": 1.2751, "step": 4434 }, { "epoch": 0.12, "learning_rate": 1.9567813228659358e-05, "loss": 1.5225, "step": 4435 }, { "epoch": 0.12, "learning_rate": 1.9567555969149093e-05, "loss": 1.5217, "step": 4436 }, { "epoch": 0.12, "learning_rate": 1.9567298634786768e-05, "loss": 1.3501, "step": 4437 }, { "epoch": 0.12, "learning_rate": 1.9567041225574398e-05, "loss": 1.5039, "step": 4438 }, { "epoch": 0.12, "learning_rate": 1.9566783741513995e-05, "loss": 1.4504, "step": 4439 }, { "epoch": 0.12, "learning_rate": 1.9566526182607575e-05, "loss": 1.426, "step": 4440 }, { "epoch": 0.12, "learning_rate": 1.956626854885715e-05, "loss": 1.3762, "step": 4441 }, { "epoch": 0.12, "learning_rate": 1.9566010840264743e-05, "loss": 1.459, "step": 4442 }, { "epoch": 0.12, "learning_rate": 1.9565753056832366e-05, "loss": 1.4531, "step": 4443 }, { "epoch": 0.12, "learning_rate": 1.9565495198562033e-05, "loss": 1.5562, "step": 4444 }, { "epoch": 0.12, "learning_rate": 1.956523726545576e-05, "loss": 1.5063, "step": 4445 }, { "epoch": 0.12, "learning_rate": 1.9564979257515576e-05, "loss": 1.2583, "step": 4446 }, { "epoch": 0.12, "learning_rate": 1.9564721174743487e-05, "loss": 1.4639, "step": 4447 }, { "epoch": 0.12, "learning_rate": 1.956446301714152e-05, "loss": 1.3813, "step": 4448 }, { "epoch": 0.12, "learning_rate": 1.9564204784711687e-05, "loss": 1.2852, "step": 4449 }, { "epoch": 0.12, "learning_rate": 1.9563946477456016e-05, "loss": 1.769, "step": 4450 }, { "epoch": 0.12, "learning_rate": 1.9563688095376524e-05, "loss": 1.3975, "step": 4451 }, { "epoch": 0.12, "learning_rate": 1.9563429638475234e-05, "loss": 1.3906, "step": 4452 }, { "epoch": 0.12, "learning_rate": 1.956317110675417e-05, "loss": 1.2515, "step": 4453 }, { "epoch": 0.12, "learning_rate": 1.9562912500215353e-05, "loss": 1.4963, "step": 4454 }, { "epoch": 0.12, "learning_rate": 1.95626538188608e-05, "loss": 1.3726, "step": 4455 }, { "epoch": 0.12, "learning_rate": 1.9562395062692544e-05, "loss": 1.5483, "step": 4456 }, { "epoch": 0.12, "learning_rate": 1.9562136231712604e-05, "loss": 1.1719, "step": 4457 }, { "epoch": 0.12, "learning_rate": 1.9561877325923008e-05, "loss": 1.4282, "step": 4458 }, { "epoch": 0.12, "learning_rate": 1.956161834532578e-05, "loss": 1.4695, "step": 4459 }, { "epoch": 0.12, "learning_rate": 1.9561359289922945e-05, "loss": 1.4697, "step": 4460 }, { "epoch": 0.12, "learning_rate": 1.9561100159716534e-05, "loss": 1.4202, "step": 4461 }, { "epoch": 0.12, "learning_rate": 1.9560840954708565e-05, "loss": 1.4165, "step": 4462 }, { "epoch": 0.12, "learning_rate": 1.956058167490108e-05, "loss": 1.2749, "step": 4463 }, { "epoch": 0.12, "learning_rate": 1.9560322320296093e-05, "loss": 1.5156, "step": 4464 }, { "epoch": 0.12, "learning_rate": 1.9560062890895642e-05, "loss": 1.4626, "step": 4465 }, { "epoch": 0.12, "learning_rate": 1.9559803386701755e-05, "loss": 1.509, "step": 4466 }, { "epoch": 0.12, "learning_rate": 1.9559543807716462e-05, "loss": 1.4194, "step": 4467 }, { "epoch": 0.12, "learning_rate": 1.9559284153941794e-05, "loss": 1.4575, "step": 4468 }, { "epoch": 0.12, "learning_rate": 1.955902442537978e-05, "loss": 1.4819, "step": 4469 }, { "epoch": 0.12, "learning_rate": 1.9558764622032456e-05, "loss": 1.3694, "step": 4470 }, { "epoch": 0.12, "learning_rate": 1.9558504743901848e-05, "loss": 1.4731, "step": 4471 }, { "epoch": 0.12, "learning_rate": 1.955824479099e-05, "loss": 1.4082, "step": 4472 }, { "epoch": 0.12, "learning_rate": 1.9557984763298937e-05, "loss": 1.418, "step": 4473 }, { "epoch": 0.12, "learning_rate": 1.9557724660830694e-05, "loss": 1.3289, "step": 4474 }, { "epoch": 0.12, "learning_rate": 1.9557464483587307e-05, "loss": 1.4224, "step": 4475 }, { "epoch": 0.12, "learning_rate": 1.9557204231570816e-05, "loss": 1.5376, "step": 4476 }, { "epoch": 0.12, "learning_rate": 1.9556943904783247e-05, "loss": 1.5254, "step": 4477 }, { "epoch": 0.12, "learning_rate": 1.9556683503226647e-05, "loss": 1.3955, "step": 4478 }, { "epoch": 0.12, "learning_rate": 1.955642302690305e-05, "loss": 1.4878, "step": 4479 }, { "epoch": 0.12, "learning_rate": 1.9556162475814494e-05, "loss": 1.4702, "step": 4480 }, { "epoch": 0.12, "learning_rate": 1.955590184996301e-05, "loss": 1.438, "step": 4481 }, { "epoch": 0.12, "learning_rate": 1.955564114935065e-05, "loss": 1.3535, "step": 4482 }, { "epoch": 0.12, "learning_rate": 1.9555380373979444e-05, "loss": 1.4082, "step": 4483 }, { "epoch": 0.12, "learning_rate": 1.9555119523851437e-05, "loss": 1.6169, "step": 4484 }, { "epoch": 0.12, "learning_rate": 1.9554858598968666e-05, "loss": 1.2351, "step": 4485 }, { "epoch": 0.12, "learning_rate": 1.9554597599333177e-05, "loss": 1.5562, "step": 4486 }, { "epoch": 0.12, "learning_rate": 1.9554336524947004e-05, "loss": 1.3464, "step": 4487 }, { "epoch": 0.12, "learning_rate": 1.95540753758122e-05, "loss": 1.3911, "step": 4488 }, { "epoch": 0.12, "learning_rate": 1.95538141519308e-05, "loss": 1.5156, "step": 4489 }, { "epoch": 0.12, "learning_rate": 1.955355285330485e-05, "loss": 1.4797, "step": 4490 }, { "epoch": 0.12, "learning_rate": 1.95532914799364e-05, "loss": 1.459, "step": 4491 }, { "epoch": 0.12, "learning_rate": 1.9553030031827486e-05, "loss": 1.5723, "step": 4492 }, { "epoch": 0.12, "learning_rate": 1.955276850898016e-05, "loss": 1.2026, "step": 4493 }, { "epoch": 0.12, "learning_rate": 1.955250691139646e-05, "loss": 1.4524, "step": 4494 }, { "epoch": 0.12, "learning_rate": 1.955224523907844e-05, "loss": 1.4851, "step": 4495 }, { "epoch": 0.12, "learning_rate": 1.9551983492028146e-05, "loss": 1.5916, "step": 4496 }, { "epoch": 0.12, "learning_rate": 1.9551721670247622e-05, "loss": 1.3394, "step": 4497 }, { "epoch": 0.12, "learning_rate": 1.9551459773738924e-05, "loss": 1.4893, "step": 4498 }, { "epoch": 0.12, "learning_rate": 1.9551197802504092e-05, "loss": 1.5239, "step": 4499 }, { "epoch": 0.12, "learning_rate": 1.9550935756545182e-05, "loss": 1.363, "step": 4500 }, { "epoch": 0.12, "learning_rate": 1.955067363586424e-05, "loss": 1.7529, "step": 4501 }, { "epoch": 0.12, "learning_rate": 1.955041144046332e-05, "loss": 1.4692, "step": 4502 }, { "epoch": 0.12, "learning_rate": 1.9550149170344474e-05, "loss": 1.4502, "step": 4503 }, { "epoch": 0.12, "learning_rate": 1.9549886825509748e-05, "loss": 1.3599, "step": 4504 }, { "epoch": 0.12, "learning_rate": 1.95496244059612e-05, "loss": 1.5913, "step": 4505 }, { "epoch": 0.12, "learning_rate": 1.954936191170088e-05, "loss": 1.8486, "step": 4506 }, { "epoch": 0.12, "learning_rate": 1.954909934273084e-05, "loss": 1.3706, "step": 4507 }, { "epoch": 0.12, "learning_rate": 1.954883669905314e-05, "loss": 1.3198, "step": 4508 }, { "epoch": 0.12, "learning_rate": 1.9548573980669837e-05, "loss": 1.5527, "step": 4509 }, { "epoch": 0.12, "learning_rate": 1.9548311187582975e-05, "loss": 1.5488, "step": 4510 }, { "epoch": 0.12, "learning_rate": 1.9548048319794617e-05, "loss": 1.2717, "step": 4511 }, { "epoch": 0.12, "learning_rate": 1.954778537730682e-05, "loss": 1.4041, "step": 4512 }, { "epoch": 0.12, "learning_rate": 1.954752236012164e-05, "loss": 1.4697, "step": 4513 }, { "epoch": 0.12, "learning_rate": 1.9547259268241134e-05, "loss": 1.4438, "step": 4514 }, { "epoch": 0.12, "learning_rate": 1.9546996101667362e-05, "loss": 1.4492, "step": 4515 }, { "epoch": 0.12, "learning_rate": 1.954673286040238e-05, "loss": 1.3379, "step": 4516 }, { "epoch": 0.12, "learning_rate": 1.954646954444825e-05, "loss": 1.5254, "step": 4517 }, { "epoch": 0.12, "learning_rate": 1.954620615380703e-05, "loss": 1.3938, "step": 4518 }, { "epoch": 0.12, "learning_rate": 1.9545942688480784e-05, "loss": 1.5112, "step": 4519 }, { "epoch": 0.12, "learning_rate": 1.954567914847157e-05, "loss": 1.5425, "step": 4520 }, { "epoch": 0.12, "learning_rate": 1.9545415533781453e-05, "loss": 1.5054, "step": 4521 }, { "epoch": 0.12, "learning_rate": 1.954515184441249e-05, "loss": 1.4775, "step": 4522 }, { "epoch": 0.12, "learning_rate": 1.954488808036675e-05, "loss": 1.3652, "step": 4523 }, { "epoch": 0.12, "learning_rate": 1.9544624241646294e-05, "loss": 1.4304, "step": 4524 }, { "epoch": 0.12, "learning_rate": 1.9544360328253185e-05, "loss": 1.4617, "step": 4525 }, { "epoch": 0.12, "learning_rate": 1.9544096340189493e-05, "loss": 1.2893, "step": 4526 }, { "epoch": 0.12, "learning_rate": 1.954383227745727e-05, "loss": 1.3718, "step": 4527 }, { "epoch": 0.12, "learning_rate": 1.9543568140058598e-05, "loss": 1.4878, "step": 4528 }, { "epoch": 0.12, "learning_rate": 1.9543303927995536e-05, "loss": 1.4609, "step": 4529 }, { "epoch": 0.12, "learning_rate": 1.954303964127015e-05, "loss": 1.4746, "step": 4530 }, { "epoch": 0.12, "learning_rate": 1.954277527988451e-05, "loss": 1.3315, "step": 4531 }, { "epoch": 0.12, "learning_rate": 1.9542510843840685e-05, "loss": 1.5715, "step": 4532 }, { "epoch": 0.12, "learning_rate": 1.954224633314074e-05, "loss": 1.4517, "step": 4533 }, { "epoch": 0.12, "learning_rate": 1.954198174778675e-05, "loss": 1.4368, "step": 4534 }, { "epoch": 0.12, "learning_rate": 1.954171708778078e-05, "loss": 1.5117, "step": 4535 }, { "epoch": 0.12, "learning_rate": 1.95414523531249e-05, "loss": 1.542, "step": 4536 }, { "epoch": 0.12, "learning_rate": 1.9541187543821186e-05, "loss": 1.4121, "step": 4537 }, { "epoch": 0.12, "learning_rate": 1.954092265987171e-05, "loss": 1.4385, "step": 4538 }, { "epoch": 0.12, "learning_rate": 1.9540657701278536e-05, "loss": 1.4456, "step": 4539 }, { "epoch": 0.12, "learning_rate": 1.9540392668043744e-05, "loss": 1.5869, "step": 4540 }, { "epoch": 0.12, "learning_rate": 1.9540127560169407e-05, "loss": 1.3442, "step": 4541 }, { "epoch": 0.12, "learning_rate": 1.9539862377657597e-05, "loss": 1.6201, "step": 4542 }, { "epoch": 0.12, "learning_rate": 1.9539597120510393e-05, "loss": 1.4985, "step": 4543 }, { "epoch": 0.12, "learning_rate": 1.9539331788729863e-05, "loss": 1.3887, "step": 4544 }, { "epoch": 0.12, "learning_rate": 1.953906638231809e-05, "loss": 1.4534, "step": 4545 }, { "epoch": 0.12, "learning_rate": 1.953880090127714e-05, "loss": 1.5742, "step": 4546 }, { "epoch": 0.12, "learning_rate": 1.9538535345609106e-05, "loss": 1.354, "step": 4547 }, { "epoch": 0.12, "learning_rate": 1.9538269715316055e-05, "loss": 1.4233, "step": 4548 }, { "epoch": 0.12, "learning_rate": 1.9538004010400063e-05, "loss": 1.3979, "step": 4549 }, { "epoch": 0.12, "learning_rate": 1.9537738230863216e-05, "loss": 1.3818, "step": 4550 }, { "epoch": 0.12, "learning_rate": 1.953747237670759e-05, "loss": 1.436, "step": 4551 }, { "epoch": 0.12, "learning_rate": 1.9537206447935264e-05, "loss": 1.4414, "step": 4552 }, { "epoch": 0.12, "learning_rate": 1.953694044454832e-05, "loss": 1.4736, "step": 4553 }, { "epoch": 0.12, "learning_rate": 1.9536674366548837e-05, "loss": 1.4399, "step": 4554 }, { "epoch": 0.12, "learning_rate": 1.95364082139389e-05, "loss": 1.5569, "step": 4555 }, { "epoch": 0.12, "learning_rate": 1.953614198672059e-05, "loss": 1.408, "step": 4556 }, { "epoch": 0.12, "learning_rate": 1.9535875684895986e-05, "loss": 1.4329, "step": 4557 }, { "epoch": 0.12, "learning_rate": 1.9535609308467178e-05, "loss": 1.3096, "step": 4558 }, { "epoch": 0.12, "learning_rate": 1.9535342857436244e-05, "loss": 1.5166, "step": 4559 }, { "epoch": 0.12, "learning_rate": 1.9535076331805275e-05, "loss": 1.4238, "step": 4560 }, { "epoch": 0.12, "learning_rate": 1.953480973157635e-05, "loss": 1.3062, "step": 4561 }, { "epoch": 0.12, "learning_rate": 1.9534543056751558e-05, "loss": 1.3147, "step": 4562 }, { "epoch": 0.12, "learning_rate": 1.953427630733298e-05, "loss": 1.4136, "step": 4563 }, { "epoch": 0.12, "learning_rate": 1.9534009483322713e-05, "loss": 1.3252, "step": 4564 }, { "epoch": 0.12, "learning_rate": 1.953374258472284e-05, "loss": 1.3667, "step": 4565 }, { "epoch": 0.12, "learning_rate": 1.9533475611535447e-05, "loss": 1.3054, "step": 4566 }, { "epoch": 0.12, "learning_rate": 1.9533208563762622e-05, "loss": 1.4448, "step": 4567 }, { "epoch": 0.12, "learning_rate": 1.9532941441406456e-05, "loss": 1.6763, "step": 4568 }, { "epoch": 0.12, "learning_rate": 1.953267424446904e-05, "loss": 1.4707, "step": 4569 }, { "epoch": 0.12, "learning_rate": 1.953240697295246e-05, "loss": 1.4272, "step": 4570 }, { "epoch": 0.12, "learning_rate": 1.9532139626858814e-05, "loss": 1.3423, "step": 4571 }, { "epoch": 0.12, "learning_rate": 1.953187220619019e-05, "loss": 1.5498, "step": 4572 }, { "epoch": 0.12, "learning_rate": 1.9531604710948677e-05, "loss": 1.3511, "step": 4573 }, { "epoch": 0.12, "learning_rate": 1.9531337141136375e-05, "loss": 1.5535, "step": 4574 }, { "epoch": 0.12, "learning_rate": 1.953106949675537e-05, "loss": 1.2415, "step": 4575 }, { "epoch": 0.12, "learning_rate": 1.953080177780776e-05, "loss": 1.3833, "step": 4576 }, { "epoch": 0.12, "learning_rate": 1.9530533984295638e-05, "loss": 1.4956, "step": 4577 }, { "epoch": 0.13, "learning_rate": 1.95302661162211e-05, "loss": 1.4658, "step": 4578 }, { "epoch": 0.13, "learning_rate": 1.9529998173586242e-05, "loss": 1.4578, "step": 4579 }, { "epoch": 0.13, "learning_rate": 1.952973015639316e-05, "loss": 1.605, "step": 4580 }, { "epoch": 0.13, "learning_rate": 1.9529462064643948e-05, "loss": 1.4695, "step": 4581 }, { "epoch": 0.13, "learning_rate": 1.952919389834071e-05, "loss": 1.4761, "step": 4582 }, { "epoch": 0.13, "learning_rate": 1.9528925657485538e-05, "loss": 1.2546, "step": 4583 }, { "epoch": 0.13, "learning_rate": 1.952865734208053e-05, "loss": 1.5215, "step": 4584 }, { "epoch": 0.13, "learning_rate": 1.952838895212779e-05, "loss": 1.3784, "step": 4585 }, { "epoch": 0.13, "learning_rate": 1.9528120487629416e-05, "loss": 1.4917, "step": 4586 }, { "epoch": 0.13, "learning_rate": 1.9527851948587508e-05, "loss": 1.3999, "step": 4587 }, { "epoch": 0.13, "learning_rate": 1.9527583335004166e-05, "loss": 1.4712, "step": 4588 }, { "epoch": 0.13, "learning_rate": 1.952731464688149e-05, "loss": 1.4932, "step": 4589 }, { "epoch": 0.13, "learning_rate": 1.9527045884221584e-05, "loss": 1.5806, "step": 4590 }, { "epoch": 0.13, "learning_rate": 1.9526777047026556e-05, "loss": 1.5537, "step": 4591 }, { "epoch": 0.13, "learning_rate": 1.95265081352985e-05, "loss": 1.3804, "step": 4592 }, { "epoch": 0.13, "learning_rate": 1.9526239149039523e-05, "loss": 1.4368, "step": 4593 }, { "epoch": 0.13, "learning_rate": 1.9525970088251736e-05, "loss": 1.457, "step": 4594 }, { "epoch": 0.13, "learning_rate": 1.9525700952937234e-05, "loss": 1.6616, "step": 4595 }, { "epoch": 0.13, "learning_rate": 1.9525431743098128e-05, "loss": 1.7808, "step": 4596 }, { "epoch": 0.13, "learning_rate": 1.952516245873652e-05, "loss": 1.2917, "step": 4597 }, { "epoch": 0.13, "learning_rate": 1.9524893099854526e-05, "loss": 1.4746, "step": 4598 }, { "epoch": 0.13, "learning_rate": 1.9524623666454243e-05, "loss": 1.4863, "step": 4599 }, { "epoch": 0.13, "learning_rate": 1.9524354158537788e-05, "loss": 1.4736, "step": 4600 }, { "epoch": 0.13, "learning_rate": 1.9524084576107258e-05, "loss": 1.3606, "step": 4601 }, { "epoch": 0.13, "learning_rate": 1.9523814919164775e-05, "loss": 1.4077, "step": 4602 }, { "epoch": 0.13, "learning_rate": 1.9523545187712435e-05, "loss": 1.3091, "step": 4603 }, { "epoch": 0.13, "learning_rate": 1.9523275381752364e-05, "loss": 1.2974, "step": 4604 }, { "epoch": 0.13, "learning_rate": 1.952300550128666e-05, "loss": 1.4458, "step": 4605 }, { "epoch": 0.13, "learning_rate": 1.952273554631744e-05, "loss": 1.3633, "step": 4606 }, { "epoch": 0.13, "learning_rate": 1.9522465516846815e-05, "loss": 1.5112, "step": 4607 }, { "epoch": 0.13, "learning_rate": 1.95221954128769e-05, "loss": 1.4727, "step": 4608 }, { "epoch": 0.13, "learning_rate": 1.95219252344098e-05, "loss": 1.2437, "step": 4609 }, { "epoch": 0.13, "learning_rate": 1.9521654981447637e-05, "loss": 1.3115, "step": 4610 }, { "epoch": 0.13, "learning_rate": 1.9521384653992525e-05, "loss": 1.3076, "step": 4611 }, { "epoch": 0.13, "learning_rate": 1.9521114252046576e-05, "loss": 1.3779, "step": 4612 }, { "epoch": 0.13, "learning_rate": 1.9520843775611907e-05, "loss": 1.48, "step": 4613 }, { "epoch": 0.13, "learning_rate": 1.952057322469063e-05, "loss": 1.5229, "step": 4614 }, { "epoch": 0.13, "learning_rate": 1.9520302599284866e-05, "loss": 1.5029, "step": 4615 }, { "epoch": 0.13, "learning_rate": 1.9520031899396735e-05, "loss": 1.5293, "step": 4616 }, { "epoch": 0.13, "learning_rate": 1.9519761125028344e-05, "loss": 1.4626, "step": 4617 }, { "epoch": 0.13, "learning_rate": 1.9519490276181826e-05, "loss": 1.4714, "step": 4618 }, { "epoch": 0.13, "learning_rate": 1.951921935285929e-05, "loss": 1.3413, "step": 4619 }, { "epoch": 0.13, "learning_rate": 1.9518948355062854e-05, "loss": 1.3508, "step": 4620 }, { "epoch": 0.13, "learning_rate": 1.951867728279465e-05, "loss": 1.4956, "step": 4621 }, { "epoch": 0.13, "learning_rate": 1.9518406136056784e-05, "loss": 1.4377, "step": 4622 }, { "epoch": 0.13, "learning_rate": 1.9518134914851384e-05, "loss": 1.4316, "step": 4623 }, { "epoch": 0.13, "learning_rate": 1.9517863619180577e-05, "loss": 1.4087, "step": 4624 }, { "epoch": 0.13, "learning_rate": 1.9517592249046476e-05, "loss": 1.5898, "step": 4625 }, { "epoch": 0.13, "learning_rate": 1.9517320804451214e-05, "loss": 1.5254, "step": 4626 }, { "epoch": 0.13, "learning_rate": 1.9517049285396907e-05, "loss": 1.3418, "step": 4627 }, { "epoch": 0.13, "learning_rate": 1.951677769188568e-05, "loss": 1.4551, "step": 4628 }, { "epoch": 0.13, "learning_rate": 1.951650602391966e-05, "loss": 1.4619, "step": 4629 }, { "epoch": 0.13, "learning_rate": 1.9516234281500972e-05, "loss": 1.3096, "step": 4630 }, { "epoch": 0.13, "learning_rate": 1.9515962464631744e-05, "loss": 1.4719, "step": 4631 }, { "epoch": 0.13, "learning_rate": 1.9515690573314097e-05, "loss": 1.4351, "step": 4632 }, { "epoch": 0.13, "learning_rate": 1.9515418607550162e-05, "loss": 1.4336, "step": 4633 }, { "epoch": 0.13, "learning_rate": 1.9515146567342066e-05, "loss": 1.397, "step": 4634 }, { "epoch": 0.13, "learning_rate": 1.951487445269194e-05, "loss": 1.5503, "step": 4635 }, { "epoch": 0.13, "learning_rate": 1.951460226360191e-05, "loss": 1.4106, "step": 4636 }, { "epoch": 0.13, "learning_rate": 1.9514330000074108e-05, "loss": 1.5391, "step": 4637 }, { "epoch": 0.13, "learning_rate": 1.9514057662110658e-05, "loss": 1.2078, "step": 4638 }, { "epoch": 0.13, "learning_rate": 1.9513785249713697e-05, "loss": 1.4385, "step": 4639 }, { "epoch": 0.13, "learning_rate": 1.9513512762885352e-05, "loss": 1.5479, "step": 4640 }, { "epoch": 0.13, "learning_rate": 1.9513240201627758e-05, "loss": 1.4641, "step": 4641 }, { "epoch": 0.13, "learning_rate": 1.9512967565943045e-05, "loss": 1.3162, "step": 4642 }, { "epoch": 0.13, "learning_rate": 1.951269485583335e-05, "loss": 1.3459, "step": 4643 }, { "epoch": 0.13, "learning_rate": 1.95124220713008e-05, "loss": 1.3577, "step": 4644 }, { "epoch": 0.13, "learning_rate": 1.9512149212347534e-05, "loss": 1.542, "step": 4645 }, { "epoch": 0.13, "learning_rate": 1.9511876278975688e-05, "loss": 1.3184, "step": 4646 }, { "epoch": 0.13, "learning_rate": 1.9511603271187393e-05, "loss": 1.4648, "step": 4647 }, { "epoch": 0.13, "learning_rate": 1.9511330188984786e-05, "loss": 1.6968, "step": 4648 }, { "epoch": 0.13, "learning_rate": 1.9511057032370004e-05, "loss": 1.3647, "step": 4649 }, { "epoch": 0.13, "learning_rate": 1.9510783801345182e-05, "loss": 1.2559, "step": 4650 }, { "epoch": 0.13, "learning_rate": 1.9510510495912464e-05, "loss": 1.5454, "step": 4651 }, { "epoch": 0.13, "learning_rate": 1.9510237116073983e-05, "loss": 1.4102, "step": 4652 }, { "epoch": 0.13, "learning_rate": 1.950996366183188e-05, "loss": 1.353, "step": 4653 }, { "epoch": 0.13, "learning_rate": 1.950969013318829e-05, "loss": 1.3574, "step": 4654 }, { "epoch": 0.13, "learning_rate": 1.950941653014536e-05, "loss": 1.3514, "step": 4655 }, { "epoch": 0.13, "learning_rate": 1.950914285270522e-05, "loss": 1.458, "step": 4656 }, { "epoch": 0.13, "learning_rate": 1.9508869100870024e-05, "loss": 1.4946, "step": 4657 }, { "epoch": 0.13, "learning_rate": 1.9508595274641906e-05, "loss": 1.3618, "step": 4658 }, { "epoch": 0.13, "learning_rate": 1.950832137402301e-05, "loss": 1.3296, "step": 4659 }, { "epoch": 0.13, "learning_rate": 1.950804739901548e-05, "loss": 1.4536, "step": 4660 }, { "epoch": 0.13, "learning_rate": 1.9507773349621454e-05, "loss": 1.583, "step": 4661 }, { "epoch": 0.13, "learning_rate": 1.9507499225843083e-05, "loss": 1.4285, "step": 4662 }, { "epoch": 0.13, "learning_rate": 1.9507225027682507e-05, "loss": 1.562, "step": 4663 }, { "epoch": 0.13, "learning_rate": 1.9506950755141875e-05, "loss": 1.6338, "step": 4664 }, { "epoch": 0.13, "learning_rate": 1.950667640822333e-05, "loss": 1.4084, "step": 4665 }, { "epoch": 0.13, "learning_rate": 1.950640198692902e-05, "loss": 1.5977, "step": 4666 }, { "epoch": 0.13, "learning_rate": 1.950612749126109e-05, "loss": 1.3008, "step": 4667 }, { "epoch": 0.13, "learning_rate": 1.950585292122169e-05, "loss": 1.3918, "step": 4668 }, { "epoch": 0.13, "learning_rate": 1.9505578276812964e-05, "loss": 1.5159, "step": 4669 }, { "epoch": 0.13, "learning_rate": 1.950530355803707e-05, "loss": 1.5103, "step": 4670 }, { "epoch": 0.13, "learning_rate": 1.9505028764896142e-05, "loss": 1.4233, "step": 4671 }, { "epoch": 0.13, "learning_rate": 1.9504753897392344e-05, "loss": 1.4768, "step": 4672 }, { "epoch": 0.13, "learning_rate": 1.9504478955527818e-05, "loss": 1.3135, "step": 4673 }, { "epoch": 0.13, "learning_rate": 1.950420393930472e-05, "loss": 1.4304, "step": 4674 }, { "epoch": 0.13, "learning_rate": 1.95039288487252e-05, "loss": 1.521, "step": 4675 }, { "epoch": 0.13, "learning_rate": 1.9503653683791408e-05, "loss": 1.439, "step": 4676 }, { "epoch": 0.13, "learning_rate": 1.95033784445055e-05, "loss": 1.5303, "step": 4677 }, { "epoch": 0.13, "learning_rate": 1.9503103130869624e-05, "loss": 1.5349, "step": 4678 }, { "epoch": 0.13, "learning_rate": 1.9502827742885943e-05, "loss": 1.3931, "step": 4679 }, { "epoch": 0.13, "learning_rate": 1.95025522805566e-05, "loss": 1.3755, "step": 4680 }, { "epoch": 0.13, "learning_rate": 1.9502276743883764e-05, "loss": 1.4858, "step": 4681 }, { "epoch": 0.13, "learning_rate": 1.950200113286958e-05, "loss": 1.2766, "step": 4682 }, { "epoch": 0.13, "learning_rate": 1.9501725447516205e-05, "loss": 1.4673, "step": 4683 }, { "epoch": 0.13, "learning_rate": 1.95014496878258e-05, "loss": 1.5132, "step": 4684 }, { "epoch": 0.13, "learning_rate": 1.9501173853800522e-05, "loss": 1.3032, "step": 4685 }, { "epoch": 0.13, "learning_rate": 1.9500897945442526e-05, "loss": 1.3118, "step": 4686 }, { "epoch": 0.13, "learning_rate": 1.950062196275397e-05, "loss": 1.177, "step": 4687 }, { "epoch": 0.13, "learning_rate": 1.9500345905737016e-05, "loss": 1.4907, "step": 4688 }, { "epoch": 0.13, "learning_rate": 1.9500069774393826e-05, "loss": 1.4619, "step": 4689 }, { "epoch": 0.13, "learning_rate": 1.9499793568726554e-05, "loss": 1.3828, "step": 4690 }, { "epoch": 0.13, "learning_rate": 1.949951728873737e-05, "loss": 1.4175, "step": 4691 }, { "epoch": 0.13, "learning_rate": 1.9499240934428422e-05, "loss": 1.5269, "step": 4692 }, { "epoch": 0.13, "learning_rate": 1.9498964505801885e-05, "loss": 1.5762, "step": 4693 }, { "epoch": 0.13, "learning_rate": 1.9498688002859913e-05, "loss": 1.5327, "step": 4694 }, { "epoch": 0.13, "learning_rate": 1.9498411425604677e-05, "loss": 1.7979, "step": 4695 }, { "epoch": 0.13, "learning_rate": 1.9498134774038333e-05, "loss": 1.4038, "step": 4696 }, { "epoch": 0.13, "learning_rate": 1.9497858048163053e-05, "loss": 1.5049, "step": 4697 }, { "epoch": 0.13, "learning_rate": 1.9497581247980993e-05, "loss": 1.4666, "step": 4698 }, { "epoch": 0.13, "learning_rate": 1.9497304373494324e-05, "loss": 1.5107, "step": 4699 }, { "epoch": 0.13, "learning_rate": 1.9497027424705214e-05, "loss": 1.4785, "step": 4700 }, { "epoch": 0.13, "learning_rate": 1.9496750401615826e-05, "loss": 1.3882, "step": 4701 }, { "epoch": 0.13, "learning_rate": 1.9496473304228327e-05, "loss": 1.5378, "step": 4702 }, { "epoch": 0.13, "learning_rate": 1.949619613254489e-05, "loss": 1.3408, "step": 4703 }, { "epoch": 0.13, "learning_rate": 1.9495918886567675e-05, "loss": 1.4824, "step": 4704 }, { "epoch": 0.13, "learning_rate": 1.9495641566298858e-05, "loss": 1.4492, "step": 4705 }, { "epoch": 0.13, "learning_rate": 1.949536417174061e-05, "loss": 1.4263, "step": 4706 }, { "epoch": 0.13, "learning_rate": 1.9495086702895093e-05, "loss": 1.6003, "step": 4707 }, { "epoch": 0.13, "learning_rate": 1.9494809159764484e-05, "loss": 1.5513, "step": 4708 }, { "epoch": 0.13, "learning_rate": 1.9494531542350953e-05, "loss": 1.4775, "step": 4709 }, { "epoch": 0.13, "learning_rate": 1.949425385065667e-05, "loss": 1.3752, "step": 4710 }, { "epoch": 0.13, "learning_rate": 1.9493976084683814e-05, "loss": 1.3979, "step": 4711 }, { "epoch": 0.13, "learning_rate": 1.9493698244434553e-05, "loss": 1.4993, "step": 4712 }, { "epoch": 0.13, "learning_rate": 1.9493420329911056e-05, "loss": 1.418, "step": 4713 }, { "epoch": 0.13, "learning_rate": 1.949314234111551e-05, "loss": 1.5522, "step": 4714 }, { "epoch": 0.13, "learning_rate": 1.9492864278050074e-05, "loss": 1.3896, "step": 4715 }, { "epoch": 0.13, "learning_rate": 1.9492586140716935e-05, "loss": 1.459, "step": 4716 }, { "epoch": 0.13, "learning_rate": 1.9492307929118272e-05, "loss": 1.5073, "step": 4717 }, { "epoch": 0.13, "learning_rate": 1.9492029643256246e-05, "loss": 1.4233, "step": 4718 }, { "epoch": 0.13, "learning_rate": 1.949175128313305e-05, "loss": 1.4634, "step": 4719 }, { "epoch": 0.13, "learning_rate": 1.949147284875085e-05, "loss": 1.3682, "step": 4720 }, { "epoch": 0.13, "learning_rate": 1.9491194340111834e-05, "loss": 1.5557, "step": 4721 }, { "epoch": 0.13, "learning_rate": 1.9490915757218176e-05, "loss": 1.4829, "step": 4722 }, { "epoch": 0.13, "learning_rate": 1.9490637100072054e-05, "loss": 1.5347, "step": 4723 }, { "epoch": 0.13, "learning_rate": 1.949035836867565e-05, "loss": 1.4585, "step": 4724 }, { "epoch": 0.13, "learning_rate": 1.9490079563031146e-05, "loss": 1.4141, "step": 4725 }, { "epoch": 0.13, "learning_rate": 1.9489800683140723e-05, "loss": 1.3975, "step": 4726 }, { "epoch": 0.13, "learning_rate": 1.948952172900656e-05, "loss": 1.4634, "step": 4727 }, { "epoch": 0.13, "learning_rate": 1.9489242700630842e-05, "loss": 1.4856, "step": 4728 }, { "epoch": 0.13, "learning_rate": 1.9488963598015752e-05, "loss": 1.3679, "step": 4729 }, { "epoch": 0.13, "learning_rate": 1.9488684421163472e-05, "loss": 1.4373, "step": 4730 }, { "epoch": 0.13, "learning_rate": 1.9488405170076188e-05, "loss": 1.3765, "step": 4731 }, { "epoch": 0.13, "learning_rate": 1.9488125844756084e-05, "loss": 1.249, "step": 4732 }, { "epoch": 0.13, "learning_rate": 1.9487846445205344e-05, "loss": 1.4373, "step": 4733 }, { "epoch": 0.13, "learning_rate": 1.9487566971426153e-05, "loss": 1.4688, "step": 4734 }, { "epoch": 0.13, "learning_rate": 1.94872874234207e-05, "loss": 1.427, "step": 4735 }, { "epoch": 0.13, "learning_rate": 1.9487007801191176e-05, "loss": 1.4082, "step": 4736 }, { "epoch": 0.13, "learning_rate": 1.948672810473976e-05, "loss": 1.457, "step": 4737 }, { "epoch": 0.13, "learning_rate": 1.9486448334068644e-05, "loss": 1.4712, "step": 4738 }, { "epoch": 0.13, "learning_rate": 1.948616848918002e-05, "loss": 1.4275, "step": 4739 }, { "epoch": 0.13, "learning_rate": 1.9485888570076074e-05, "loss": 1.5625, "step": 4740 }, { "epoch": 0.13, "learning_rate": 1.948560857675899e-05, "loss": 1.3213, "step": 4741 }, { "epoch": 0.13, "learning_rate": 1.948532850923097e-05, "loss": 1.4678, "step": 4742 }, { "epoch": 0.13, "learning_rate": 1.94850483674942e-05, "loss": 1.3252, "step": 4743 }, { "epoch": 0.13, "learning_rate": 1.9484768151550873e-05, "loss": 1.3137, "step": 4744 }, { "epoch": 0.13, "learning_rate": 1.9484487861403177e-05, "loss": 1.4636, "step": 4745 }, { "epoch": 0.13, "learning_rate": 1.9484207497053314e-05, "loss": 1.4656, "step": 4746 }, { "epoch": 0.13, "learning_rate": 1.9483927058503463e-05, "loss": 1.5337, "step": 4747 }, { "epoch": 0.13, "learning_rate": 1.9483646545755834e-05, "loss": 1.2903, "step": 4748 }, { "epoch": 0.13, "learning_rate": 1.9483365958812607e-05, "loss": 1.4609, "step": 4749 }, { "epoch": 0.13, "learning_rate": 1.948308529767599e-05, "loss": 1.3549, "step": 4750 }, { "epoch": 0.13, "learning_rate": 1.948280456234817e-05, "loss": 1.5552, "step": 4751 }, { "epoch": 0.13, "learning_rate": 1.9482523752831345e-05, "loss": 1.4258, "step": 4752 }, { "epoch": 0.13, "learning_rate": 1.9482242869127716e-05, "loss": 1.437, "step": 4753 }, { "epoch": 0.13, "learning_rate": 1.948196191123948e-05, "loss": 1.3726, "step": 4754 }, { "epoch": 0.13, "learning_rate": 1.9481680879168824e-05, "loss": 1.5356, "step": 4755 }, { "epoch": 0.13, "learning_rate": 1.948139977291796e-05, "loss": 1.4783, "step": 4756 }, { "epoch": 0.13, "learning_rate": 1.9481118592489086e-05, "loss": 1.4907, "step": 4757 }, { "epoch": 0.13, "learning_rate": 1.9480837337884397e-05, "loss": 1.3333, "step": 4758 }, { "epoch": 0.13, "learning_rate": 1.948055600910609e-05, "loss": 1.4763, "step": 4759 }, { "epoch": 0.13, "learning_rate": 1.9480274606156377e-05, "loss": 1.3745, "step": 4760 }, { "epoch": 0.13, "learning_rate": 1.947999312903745e-05, "loss": 1.3877, "step": 4761 }, { "epoch": 0.13, "learning_rate": 1.9479711577751513e-05, "loss": 1.4333, "step": 4762 }, { "epoch": 0.13, "learning_rate": 1.9479429952300773e-05, "loss": 1.4163, "step": 4763 }, { "epoch": 0.13, "learning_rate": 1.947914825268743e-05, "loss": 1.4946, "step": 4764 }, { "epoch": 0.13, "learning_rate": 1.947886647891369e-05, "loss": 1.4839, "step": 4765 }, { "epoch": 0.13, "learning_rate": 1.9478584630981754e-05, "loss": 1.5225, "step": 4766 }, { "epoch": 0.13, "learning_rate": 1.9478302708893832e-05, "loss": 1.4175, "step": 4767 }, { "epoch": 0.13, "learning_rate": 1.9478020712652122e-05, "loss": 1.2739, "step": 4768 }, { "epoch": 0.13, "learning_rate": 1.9477738642258838e-05, "loss": 1.4575, "step": 4769 }, { "epoch": 0.13, "learning_rate": 1.9477456497716184e-05, "loss": 1.5503, "step": 4770 }, { "epoch": 0.13, "learning_rate": 1.9477174279026364e-05, "loss": 1.5483, "step": 4771 }, { "epoch": 0.13, "learning_rate": 1.9476891986191592e-05, "loss": 1.4688, "step": 4772 }, { "epoch": 0.13, "learning_rate": 1.9476609619214072e-05, "loss": 1.5681, "step": 4773 }, { "epoch": 0.13, "learning_rate": 1.947632717809601e-05, "loss": 1.3557, "step": 4774 }, { "epoch": 0.13, "learning_rate": 1.9476044662839627e-05, "loss": 1.3682, "step": 4775 }, { "epoch": 0.13, "learning_rate": 1.9475762073447125e-05, "loss": 1.2874, "step": 4776 }, { "epoch": 0.13, "learning_rate": 1.9475479409920717e-05, "loss": 1.4883, "step": 4777 }, { "epoch": 0.13, "learning_rate": 1.947519667226261e-05, "loss": 1.5552, "step": 4778 }, { "epoch": 0.13, "learning_rate": 1.9474913860475026e-05, "loss": 1.4102, "step": 4779 }, { "epoch": 0.13, "learning_rate": 1.9474630974560165e-05, "loss": 1.4138, "step": 4780 }, { "epoch": 0.13, "learning_rate": 1.9474348014520248e-05, "loss": 1.3611, "step": 4781 }, { "epoch": 0.13, "learning_rate": 1.947406498035749e-05, "loss": 1.5601, "step": 4782 }, { "epoch": 0.13, "learning_rate": 1.94737818720741e-05, "loss": 1.4551, "step": 4783 }, { "epoch": 0.13, "learning_rate": 1.9473498689672298e-05, "loss": 1.3169, "step": 4784 }, { "epoch": 0.13, "learning_rate": 1.9473215433154292e-05, "loss": 1.4805, "step": 4785 }, { "epoch": 0.13, "learning_rate": 1.9472932102522312e-05, "loss": 1.3838, "step": 4786 }, { "epoch": 0.13, "learning_rate": 1.9472648697778558e-05, "loss": 1.4937, "step": 4787 }, { "epoch": 0.13, "learning_rate": 1.9472365218925255e-05, "loss": 1.4016, "step": 4788 }, { "epoch": 0.13, "learning_rate": 1.9472081665964622e-05, "loss": 1.4011, "step": 4789 }, { "epoch": 0.13, "learning_rate": 1.947179803889888e-05, "loss": 1.4343, "step": 4790 }, { "epoch": 0.13, "learning_rate": 1.947151433773024e-05, "loss": 1.4888, "step": 4791 }, { "epoch": 0.13, "learning_rate": 1.947123056246093e-05, "loss": 1.5278, "step": 4792 }, { "epoch": 0.13, "learning_rate": 1.947094671309316e-05, "loss": 1.3889, "step": 4793 }, { "epoch": 0.13, "learning_rate": 1.947066278962916e-05, "loss": 1.5708, "step": 4794 }, { "epoch": 0.13, "learning_rate": 1.9470378792071147e-05, "loss": 1.4688, "step": 4795 }, { "epoch": 0.13, "learning_rate": 1.9470094720421344e-05, "loss": 1.2185, "step": 4796 }, { "epoch": 0.13, "learning_rate": 1.946981057468197e-05, "loss": 1.479, "step": 4797 }, { "epoch": 0.13, "learning_rate": 1.9469526354855256e-05, "loss": 1.425, "step": 4798 }, { "epoch": 0.13, "learning_rate": 1.946924206094342e-05, "loss": 1.374, "step": 4799 }, { "epoch": 0.13, "learning_rate": 1.9468957692948684e-05, "loss": 1.4822, "step": 4800 }, { "epoch": 0.13, "learning_rate": 1.9468673250873275e-05, "loss": 1.4478, "step": 4801 }, { "epoch": 0.13, "learning_rate": 1.946838873471942e-05, "loss": 1.4551, "step": 4802 }, { "epoch": 0.13, "learning_rate": 1.9468104144489345e-05, "loss": 1.4019, "step": 4803 }, { "epoch": 0.13, "learning_rate": 1.9467819480185277e-05, "loss": 1.5659, "step": 4804 }, { "epoch": 0.13, "learning_rate": 1.946753474180944e-05, "loss": 1.4055, "step": 4805 }, { "epoch": 0.13, "learning_rate": 1.946724992936406e-05, "loss": 1.4038, "step": 4806 }, { "epoch": 0.13, "learning_rate": 1.9466965042851372e-05, "loss": 1.3472, "step": 4807 }, { "epoch": 0.13, "learning_rate": 1.94666800822736e-05, "loss": 1.4724, "step": 4808 }, { "epoch": 0.13, "learning_rate": 1.946639504763298e-05, "loss": 1.3352, "step": 4809 }, { "epoch": 0.13, "learning_rate": 1.9466109938931727e-05, "loss": 1.3774, "step": 4810 }, { "epoch": 0.13, "learning_rate": 1.9465824756172087e-05, "loss": 1.4597, "step": 4811 }, { "epoch": 0.13, "learning_rate": 1.9465539499356282e-05, "loss": 1.3918, "step": 4812 }, { "epoch": 0.13, "learning_rate": 1.9465254168486548e-05, "loss": 1.4248, "step": 4813 }, { "epoch": 0.13, "learning_rate": 1.9464968763565118e-05, "loss": 1.3633, "step": 4814 }, { "epoch": 0.13, "learning_rate": 1.9464683284594224e-05, "loss": 1.4746, "step": 4815 }, { "epoch": 0.13, "learning_rate": 1.9464397731576093e-05, "loss": 1.4224, "step": 4816 }, { "epoch": 0.13, "learning_rate": 1.9464112104512968e-05, "loss": 1.4888, "step": 4817 }, { "epoch": 0.13, "learning_rate": 1.9463826403407084e-05, "loss": 1.4722, "step": 4818 }, { "epoch": 0.13, "learning_rate": 1.9463540628260668e-05, "loss": 1.2761, "step": 4819 }, { "epoch": 0.13, "learning_rate": 1.9463254779075963e-05, "loss": 1.4827, "step": 4820 }, { "epoch": 0.13, "learning_rate": 1.94629688558552e-05, "loss": 1.3845, "step": 4821 }, { "epoch": 0.13, "learning_rate": 1.946268285860062e-05, "loss": 1.4414, "step": 4822 }, { "epoch": 0.13, "learning_rate": 1.9462396787314456e-05, "loss": 1.4041, "step": 4823 }, { "epoch": 0.13, "learning_rate": 1.946211064199895e-05, "loss": 1.4631, "step": 4824 }, { "epoch": 0.13, "learning_rate": 1.9461824422656345e-05, "loss": 1.4014, "step": 4825 }, { "epoch": 0.13, "learning_rate": 1.9461538129288867e-05, "loss": 1.3716, "step": 4826 }, { "epoch": 0.13, "learning_rate": 1.946125176189877e-05, "loss": 1.395, "step": 4827 }, { "epoch": 0.13, "learning_rate": 1.9460965320488285e-05, "loss": 1.4116, "step": 4828 }, { "epoch": 0.13, "learning_rate": 1.9460678805059657e-05, "loss": 1.3677, "step": 4829 }, { "epoch": 0.13, "learning_rate": 1.9460392215615126e-05, "loss": 1.8208, "step": 4830 }, { "epoch": 0.13, "learning_rate": 1.9460105552156937e-05, "loss": 1.4595, "step": 4831 }, { "epoch": 0.13, "learning_rate": 1.945981881468733e-05, "loss": 1.4504, "step": 4832 }, { "epoch": 0.13, "learning_rate": 1.9459532003208547e-05, "loss": 1.4783, "step": 4833 }, { "epoch": 0.13, "learning_rate": 1.9459245117722836e-05, "loss": 1.541, "step": 4834 }, { "epoch": 0.13, "learning_rate": 1.945895815823244e-05, "loss": 1.4954, "step": 4835 }, { "epoch": 0.13, "learning_rate": 1.94586711247396e-05, "loss": 1.4775, "step": 4836 }, { "epoch": 0.13, "learning_rate": 1.9458384017246566e-05, "loss": 1.4744, "step": 4837 }, { "epoch": 0.13, "learning_rate": 1.9458096835755583e-05, "loss": 1.4004, "step": 4838 }, { "epoch": 0.13, "learning_rate": 1.94578095802689e-05, "loss": 1.4546, "step": 4839 }, { "epoch": 0.13, "learning_rate": 1.9457522250788758e-05, "loss": 1.4365, "step": 4840 }, { "epoch": 0.13, "learning_rate": 1.9457234847317415e-05, "loss": 1.4961, "step": 4841 }, { "epoch": 0.13, "learning_rate": 1.9456947369857108e-05, "loss": 1.5747, "step": 4842 }, { "epoch": 0.13, "learning_rate": 1.9456659818410095e-05, "loss": 1.2717, "step": 4843 }, { "epoch": 0.13, "learning_rate": 1.9456372192978624e-05, "loss": 1.4514, "step": 4844 }, { "epoch": 0.13, "learning_rate": 1.945608449356494e-05, "loss": 1.4565, "step": 4845 }, { "epoch": 0.13, "learning_rate": 1.9455796720171298e-05, "loss": 1.5571, "step": 4846 }, { "epoch": 0.13, "learning_rate": 1.945550887279995e-05, "loss": 1.4626, "step": 4847 }, { "epoch": 0.13, "learning_rate": 1.9455220951453147e-05, "loss": 1.4917, "step": 4848 }, { "epoch": 0.13, "learning_rate": 1.9454932956133142e-05, "loss": 1.333, "step": 4849 }, { "epoch": 0.13, "learning_rate": 1.9454644886842183e-05, "loss": 1.3201, "step": 4850 }, { "epoch": 0.13, "learning_rate": 1.9454356743582534e-05, "loss": 1.4028, "step": 4851 }, { "epoch": 0.13, "learning_rate": 1.945406852635644e-05, "loss": 1.4434, "step": 4852 }, { "epoch": 0.13, "learning_rate": 1.945378023516616e-05, "loss": 1.4944, "step": 4853 }, { "epoch": 0.13, "learning_rate": 1.9453491870013952e-05, "loss": 1.4417, "step": 4854 }, { "epoch": 0.13, "learning_rate": 1.945320343090207e-05, "loss": 1.4775, "step": 4855 }, { "epoch": 0.13, "learning_rate": 1.9452914917832765e-05, "loss": 1.5244, "step": 4856 }, { "epoch": 0.13, "learning_rate": 1.94526263308083e-05, "loss": 1.4937, "step": 4857 }, { "epoch": 0.13, "learning_rate": 1.9452337669830932e-05, "loss": 1.3523, "step": 4858 }, { "epoch": 0.13, "learning_rate": 1.9452048934902916e-05, "loss": 1.5222, "step": 4859 }, { "epoch": 0.13, "learning_rate": 1.945176012602652e-05, "loss": 1.3809, "step": 4860 }, { "epoch": 0.13, "learning_rate": 1.9451471243203992e-05, "loss": 1.5581, "step": 4861 }, { "epoch": 0.13, "learning_rate": 1.94511822864376e-05, "loss": 1.2825, "step": 4862 }, { "epoch": 0.13, "learning_rate": 1.94508932557296e-05, "loss": 1.4526, "step": 4863 }, { "epoch": 0.13, "learning_rate": 1.9450604151082255e-05, "loss": 1.3748, "step": 4864 }, { "epoch": 0.13, "learning_rate": 1.945031497249783e-05, "loss": 1.4927, "step": 4865 }, { "epoch": 0.13, "learning_rate": 1.945002571997858e-05, "loss": 1.4902, "step": 4866 }, { "epoch": 0.13, "learning_rate": 1.9449736393526777e-05, "loss": 1.3457, "step": 4867 }, { "epoch": 0.13, "learning_rate": 1.9449446993144677e-05, "loss": 1.2511, "step": 4868 }, { "epoch": 0.13, "learning_rate": 1.944915751883455e-05, "loss": 1.3584, "step": 4869 }, { "epoch": 0.13, "learning_rate": 1.9448867970598658e-05, "loss": 1.3884, "step": 4870 }, { "epoch": 0.13, "learning_rate": 1.9448578348439263e-05, "loss": 1.4934, "step": 4871 }, { "epoch": 0.13, "learning_rate": 1.944828865235864e-05, "loss": 1.2668, "step": 4872 }, { "epoch": 0.13, "learning_rate": 1.944799888235904e-05, "loss": 1.2522, "step": 4873 }, { "epoch": 0.13, "learning_rate": 1.9447709038442748e-05, "loss": 1.4595, "step": 4874 }, { "epoch": 0.13, "learning_rate": 1.9447419120612018e-05, "loss": 1.4827, "step": 4875 }, { "epoch": 0.13, "learning_rate": 1.9447129128869126e-05, "loss": 1.449, "step": 4876 }, { "epoch": 0.13, "learning_rate": 1.9446839063216337e-05, "loss": 1.5269, "step": 4877 }, { "epoch": 0.13, "learning_rate": 1.9446548923655923e-05, "loss": 1.4543, "step": 4878 }, { "epoch": 0.13, "learning_rate": 1.9446258710190152e-05, "loss": 1.3076, "step": 4879 }, { "epoch": 0.13, "learning_rate": 1.9445968422821292e-05, "loss": 1.542, "step": 4880 }, { "epoch": 0.13, "learning_rate": 1.944567806155162e-05, "loss": 1.3113, "step": 4881 }, { "epoch": 0.13, "learning_rate": 1.9445387626383402e-05, "loss": 1.4199, "step": 4882 }, { "epoch": 0.13, "learning_rate": 1.9445097117318915e-05, "loss": 1.5068, "step": 4883 }, { "epoch": 0.13, "learning_rate": 1.944480653436043e-05, "loss": 1.4436, "step": 4884 }, { "epoch": 0.13, "learning_rate": 1.9444515877510213e-05, "loss": 1.512, "step": 4885 }, { "epoch": 0.13, "learning_rate": 1.9444225146770553e-05, "loss": 1.3901, "step": 4886 }, { "epoch": 0.13, "learning_rate": 1.944393434214371e-05, "loss": 1.5596, "step": 4887 }, { "epoch": 0.13, "learning_rate": 1.944364346363197e-05, "loss": 1.4192, "step": 4888 }, { "epoch": 0.13, "learning_rate": 1.9443352511237604e-05, "loss": 1.8076, "step": 4889 }, { "epoch": 0.13, "learning_rate": 1.944306148496289e-05, "loss": 1.4036, "step": 4890 }, { "epoch": 0.13, "learning_rate": 1.94427703848101e-05, "loss": 1.386, "step": 4891 }, { "epoch": 0.13, "learning_rate": 1.9442479210781514e-05, "loss": 1.3687, "step": 4892 }, { "epoch": 0.13, "learning_rate": 1.9442187962879417e-05, "loss": 1.77, "step": 4893 }, { "epoch": 0.13, "learning_rate": 1.944189664110608e-05, "loss": 1.2832, "step": 4894 }, { "epoch": 0.13, "learning_rate": 1.9441605245463776e-05, "loss": 1.2109, "step": 4895 }, { "epoch": 0.13, "learning_rate": 1.9441313775954796e-05, "loss": 1.323, "step": 4896 }, { "epoch": 0.13, "learning_rate": 1.944102223258142e-05, "loss": 1.3582, "step": 4897 }, { "epoch": 0.13, "learning_rate": 1.9440730615345923e-05, "loss": 1.3271, "step": 4898 }, { "epoch": 0.13, "learning_rate": 1.944043892425059e-05, "loss": 1.4814, "step": 4899 }, { "epoch": 0.13, "learning_rate": 1.94401471592977e-05, "loss": 1.4248, "step": 4900 }, { "epoch": 0.13, "learning_rate": 1.943985532048954e-05, "loss": 1.4448, "step": 4901 }, { "epoch": 0.13, "learning_rate": 1.943956340782839e-05, "loss": 1.53, "step": 4902 }, { "epoch": 0.13, "learning_rate": 1.9439271421316535e-05, "loss": 1.4834, "step": 4903 }, { "epoch": 0.13, "learning_rate": 1.9438979360956257e-05, "loss": 1.5547, "step": 4904 }, { "epoch": 0.13, "learning_rate": 1.9438687226749848e-05, "loss": 1.4683, "step": 4905 }, { "epoch": 0.13, "learning_rate": 1.9438395018699584e-05, "loss": 1.3765, "step": 4906 }, { "epoch": 0.13, "learning_rate": 1.943810273680776e-05, "loss": 1.4741, "step": 4907 }, { "epoch": 0.13, "learning_rate": 1.9437810381076653e-05, "loss": 1.4028, "step": 4908 }, { "epoch": 0.13, "learning_rate": 1.9437517951508557e-05, "loss": 1.4392, "step": 4909 }, { "epoch": 0.13, "learning_rate": 1.943722544810576e-05, "loss": 1.4878, "step": 4910 }, { "epoch": 0.13, "learning_rate": 1.943693287087055e-05, "loss": 1.4619, "step": 4911 }, { "epoch": 0.13, "learning_rate": 1.943664021980521e-05, "loss": 1.4165, "step": 4912 }, { "epoch": 0.13, "learning_rate": 1.9436347494912038e-05, "loss": 1.5518, "step": 4913 }, { "epoch": 0.13, "learning_rate": 1.943605469619332e-05, "loss": 1.4163, "step": 4914 }, { "epoch": 0.13, "learning_rate": 1.9435761823651346e-05, "loss": 1.4663, "step": 4915 }, { "epoch": 0.13, "learning_rate": 1.9435468877288408e-05, "loss": 1.5266, "step": 4916 }, { "epoch": 0.13, "learning_rate": 1.94351758571068e-05, "loss": 1.4771, "step": 4917 }, { "epoch": 0.13, "learning_rate": 1.9434882763108814e-05, "loss": 1.8555, "step": 4918 }, { "epoch": 0.13, "learning_rate": 1.943458959529674e-05, "loss": 1.4646, "step": 4919 }, { "epoch": 0.13, "learning_rate": 1.9434296353672875e-05, "loss": 1.3735, "step": 4920 }, { "epoch": 0.13, "learning_rate": 1.943400303823951e-05, "loss": 1.4131, "step": 4921 }, { "epoch": 0.13, "learning_rate": 1.9433709648998943e-05, "loss": 1.3499, "step": 4922 }, { "epoch": 0.13, "learning_rate": 1.9433416185953466e-05, "loss": 1.4316, "step": 4923 }, { "epoch": 0.13, "learning_rate": 1.9433122649105375e-05, "loss": 1.3618, "step": 4924 }, { "epoch": 0.13, "learning_rate": 1.943282903845697e-05, "loss": 1.2795, "step": 4925 }, { "epoch": 0.13, "learning_rate": 1.9432535354010546e-05, "loss": 1.3828, "step": 4926 }, { "epoch": 0.13, "learning_rate": 1.9432241595768405e-05, "loss": 1.3855, "step": 4927 }, { "epoch": 0.13, "learning_rate": 1.943194776373284e-05, "loss": 1.4253, "step": 4928 }, { "epoch": 0.13, "learning_rate": 1.9431653857906147e-05, "loss": 1.3425, "step": 4929 }, { "epoch": 0.13, "learning_rate": 1.943135987829063e-05, "loss": 1.4656, "step": 4930 }, { "epoch": 0.13, "learning_rate": 1.9431065824888587e-05, "loss": 1.3994, "step": 4931 }, { "epoch": 0.13, "learning_rate": 1.9430771697702324e-05, "loss": 1.3818, "step": 4932 }, { "epoch": 0.13, "learning_rate": 1.9430477496734134e-05, "loss": 1.4495, "step": 4933 }, { "epoch": 0.13, "learning_rate": 1.9430183221986325e-05, "loss": 1.3052, "step": 4934 }, { "epoch": 0.13, "learning_rate": 1.9429888873461194e-05, "loss": 1.2893, "step": 4935 }, { "epoch": 0.13, "learning_rate": 1.9429594451161052e-05, "loss": 1.4146, "step": 4936 }, { "epoch": 0.13, "learning_rate": 1.9429299955088196e-05, "loss": 1.4626, "step": 4937 }, { "epoch": 0.13, "learning_rate": 1.9429005385244927e-05, "loss": 1.4368, "step": 4938 }, { "epoch": 0.13, "learning_rate": 1.9428710741633554e-05, "loss": 1.3701, "step": 4939 }, { "epoch": 0.13, "learning_rate": 1.9428416024256383e-05, "loss": 1.5356, "step": 4940 }, { "epoch": 0.13, "learning_rate": 1.942812123311572e-05, "loss": 1.1704, "step": 4941 }, { "epoch": 0.13, "learning_rate": 1.942782636821387e-05, "loss": 1.4109, "step": 4942 }, { "epoch": 0.13, "learning_rate": 1.942753142955314e-05, "loss": 1.4409, "step": 4943 }, { "epoch": 0.14, "learning_rate": 1.9427236417135837e-05, "loss": 1.4753, "step": 4944 }, { "epoch": 0.14, "learning_rate": 1.9426941330964267e-05, "loss": 1.499, "step": 4945 }, { "epoch": 0.14, "learning_rate": 1.9426646171040743e-05, "loss": 1.4609, "step": 4946 }, { "epoch": 0.14, "learning_rate": 1.9426350937367572e-05, "loss": 1.3707, "step": 4947 }, { "epoch": 0.14, "learning_rate": 1.9426055629947063e-05, "loss": 1.6245, "step": 4948 }, { "epoch": 0.14, "learning_rate": 1.9425760248781525e-05, "loss": 1.3748, "step": 4949 }, { "epoch": 0.14, "learning_rate": 1.9425464793873275e-05, "loss": 1.4282, "step": 4950 }, { "epoch": 0.14, "learning_rate": 1.942516926522462e-05, "loss": 1.314, "step": 4951 }, { "epoch": 0.14, "learning_rate": 1.9424873662837875e-05, "loss": 1.2448, "step": 4952 }, { "epoch": 0.14, "learning_rate": 1.9424577986715345e-05, "loss": 1.2935, "step": 4953 }, { "epoch": 0.14, "learning_rate": 1.9424282236859347e-05, "loss": 1.3623, "step": 4954 }, { "epoch": 0.14, "learning_rate": 1.9423986413272204e-05, "loss": 1.4321, "step": 4955 }, { "epoch": 0.14, "learning_rate": 1.942369051595622e-05, "loss": 1.2744, "step": 4956 }, { "epoch": 0.14, "learning_rate": 1.9423394544913708e-05, "loss": 1.5591, "step": 4957 }, { "epoch": 0.14, "learning_rate": 1.9423098500146994e-05, "loss": 1.5437, "step": 4958 }, { "epoch": 0.14, "learning_rate": 1.9422802381658384e-05, "loss": 1.4468, "step": 4959 }, { "epoch": 0.14, "learning_rate": 1.9422506189450203e-05, "loss": 1.4875, "step": 4960 }, { "epoch": 0.14, "learning_rate": 1.9422209923524766e-05, "loss": 1.4893, "step": 4961 }, { "epoch": 0.14, "learning_rate": 1.9421913583884385e-05, "loss": 1.4419, "step": 4962 }, { "epoch": 0.14, "learning_rate": 1.9421617170531382e-05, "loss": 1.3999, "step": 4963 }, { "epoch": 0.14, "learning_rate": 1.9421320683468078e-05, "loss": 1.5176, "step": 4964 }, { "epoch": 0.14, "learning_rate": 1.9421024122696793e-05, "loss": 1.271, "step": 4965 }, { "epoch": 0.14, "learning_rate": 1.9420727488219842e-05, "loss": 1.3457, "step": 4966 }, { "epoch": 0.14, "learning_rate": 1.9420430780039553e-05, "loss": 1.4634, "step": 4967 }, { "epoch": 0.14, "learning_rate": 1.942013399815824e-05, "loss": 1.4016, "step": 4968 }, { "epoch": 0.14, "learning_rate": 1.9419837142578228e-05, "loss": 1.4517, "step": 4969 }, { "epoch": 0.14, "learning_rate": 1.9419540213301845e-05, "loss": 1.4243, "step": 4970 }, { "epoch": 0.14, "learning_rate": 1.9419243210331403e-05, "loss": 1.3953, "step": 4971 }, { "epoch": 0.14, "learning_rate": 1.9418946133669233e-05, "loss": 1.4966, "step": 4972 }, { "epoch": 0.14, "learning_rate": 1.9418648983317657e-05, "loss": 1.5903, "step": 4973 }, { "epoch": 0.14, "learning_rate": 1.9418351759279002e-05, "loss": 1.3472, "step": 4974 }, { "epoch": 0.14, "learning_rate": 1.941805446155559e-05, "loss": 1.2703, "step": 4975 }, { "epoch": 0.14, "learning_rate": 1.9417757090149752e-05, "loss": 1.3853, "step": 4976 }, { "epoch": 0.14, "learning_rate": 1.941745964506381e-05, "loss": 1.4214, "step": 4977 }, { "epoch": 0.14, "learning_rate": 1.9417162126300087e-05, "loss": 1.5244, "step": 4978 }, { "epoch": 0.14, "learning_rate": 1.941686453386092e-05, "loss": 1.5308, "step": 4979 }, { "epoch": 0.14, "learning_rate": 1.9416566867748632e-05, "loss": 1.4648, "step": 4980 }, { "epoch": 0.14, "learning_rate": 1.941626912796555e-05, "loss": 1.2305, "step": 4981 }, { "epoch": 0.14, "learning_rate": 1.9415971314514012e-05, "loss": 1.3113, "step": 4982 }, { "epoch": 0.14, "learning_rate": 1.941567342739634e-05, "loss": 1.2502, "step": 4983 }, { "epoch": 0.14, "learning_rate": 1.9415375466614867e-05, "loss": 1.3611, "step": 4984 }, { "epoch": 0.14, "learning_rate": 1.941507743217192e-05, "loss": 1.4282, "step": 4985 }, { "epoch": 0.14, "learning_rate": 1.941477932406984e-05, "loss": 1.5027, "step": 4986 }, { "epoch": 0.14, "learning_rate": 1.941448114231095e-05, "loss": 1.354, "step": 4987 }, { "epoch": 0.14, "learning_rate": 1.941418288689759e-05, "loss": 1.3884, "step": 4988 }, { "epoch": 0.14, "learning_rate": 1.9413884557832084e-05, "loss": 1.3901, "step": 4989 }, { "epoch": 0.14, "learning_rate": 1.9413586155116776e-05, "loss": 1.4294, "step": 4990 }, { "epoch": 0.14, "learning_rate": 1.9413287678754e-05, "loss": 1.5278, "step": 4991 }, { "epoch": 0.14, "learning_rate": 1.9412989128746083e-05, "loss": 1.4663, "step": 4992 }, { "epoch": 0.14, "learning_rate": 1.9412690505095363e-05, "loss": 1.3594, "step": 4993 }, { "epoch": 0.14, "learning_rate": 1.9412391807804184e-05, "loss": 1.4043, "step": 4994 }, { "epoch": 0.14, "learning_rate": 1.9412093036874876e-05, "loss": 1.3914, "step": 4995 }, { "epoch": 0.14, "learning_rate": 1.9411794192309777e-05, "loss": 1.5044, "step": 4996 }, { "epoch": 0.14, "learning_rate": 1.9411495274111224e-05, "loss": 1.3726, "step": 4997 }, { "epoch": 0.14, "learning_rate": 1.941119628228156e-05, "loss": 1.4568, "step": 4998 }, { "epoch": 0.14, "learning_rate": 1.941089721682312e-05, "loss": 1.4299, "step": 4999 }, { "epoch": 0.14, "learning_rate": 1.941059807773825e-05, "loss": 1.3477, "step": 5000 }, { "epoch": 0.14, "learning_rate": 1.941029886502928e-05, "loss": 1.4323, "step": 5001 }, { "epoch": 0.14, "learning_rate": 1.940999957869856e-05, "loss": 1.3328, "step": 5002 }, { "epoch": 0.14, "learning_rate": 1.940970021874843e-05, "loss": 1.3909, "step": 5003 }, { "epoch": 0.14, "learning_rate": 1.9409400785181227e-05, "loss": 1.2336, "step": 5004 }, { "epoch": 0.14, "learning_rate": 1.9409101277999296e-05, "loss": 1.4568, "step": 5005 }, { "epoch": 0.14, "learning_rate": 1.9408801697204985e-05, "loss": 1.3086, "step": 5006 }, { "epoch": 0.14, "learning_rate": 1.940850204280063e-05, "loss": 1.3606, "step": 5007 }, { "epoch": 0.14, "learning_rate": 1.940820231478858e-05, "loss": 1.2358, "step": 5008 }, { "epoch": 0.14, "learning_rate": 1.940790251317118e-05, "loss": 1.3348, "step": 5009 }, { "epoch": 0.14, "learning_rate": 1.9407602637950775e-05, "loss": 1.4626, "step": 5010 }, { "epoch": 0.14, "learning_rate": 1.940730268912971e-05, "loss": 1.4421, "step": 5011 }, { "epoch": 0.14, "learning_rate": 1.9407002666710334e-05, "loss": 1.3718, "step": 5012 }, { "epoch": 0.14, "learning_rate": 1.940670257069499e-05, "loss": 1.3535, "step": 5013 }, { "epoch": 0.14, "learning_rate": 1.940640240108603e-05, "loss": 1.5645, "step": 5014 }, { "epoch": 0.14, "learning_rate": 1.9406102157885802e-05, "loss": 1.6304, "step": 5015 }, { "epoch": 0.14, "learning_rate": 1.940580184109665e-05, "loss": 1.4653, "step": 5016 }, { "epoch": 0.14, "learning_rate": 1.940550145072093e-05, "loss": 1.3713, "step": 5017 }, { "epoch": 0.14, "learning_rate": 1.940520098676099e-05, "loss": 1.376, "step": 5018 }, { "epoch": 0.14, "learning_rate": 1.9404900449219178e-05, "loss": 1.408, "step": 5019 }, { "epoch": 0.14, "learning_rate": 1.9404599838097852e-05, "loss": 1.3411, "step": 5020 }, { "epoch": 0.14, "learning_rate": 1.9404299153399355e-05, "loss": 1.4348, "step": 5021 }, { "epoch": 0.14, "learning_rate": 1.9403998395126044e-05, "loss": 1.1567, "step": 5022 }, { "epoch": 0.14, "learning_rate": 1.9403697563280275e-05, "loss": 1.4849, "step": 5023 }, { "epoch": 0.14, "learning_rate": 1.940339665786439e-05, "loss": 1.3125, "step": 5024 }, { "epoch": 0.14, "learning_rate": 1.940309567888076e-05, "loss": 1.5073, "step": 5025 }, { "epoch": 0.14, "learning_rate": 1.9402794626331727e-05, "loss": 1.3594, "step": 5026 }, { "epoch": 0.14, "learning_rate": 1.940249350021965e-05, "loss": 1.3064, "step": 5027 }, { "epoch": 0.14, "learning_rate": 1.9402192300546887e-05, "loss": 1.4331, "step": 5028 }, { "epoch": 0.14, "learning_rate": 1.9401891027315793e-05, "loss": 1.3486, "step": 5029 }, { "epoch": 0.14, "learning_rate": 1.9401589680528724e-05, "loss": 1.3638, "step": 5030 }, { "epoch": 0.14, "learning_rate": 1.9401288260188037e-05, "loss": 1.5347, "step": 5031 }, { "epoch": 0.14, "learning_rate": 1.9400986766296092e-05, "loss": 1.4778, "step": 5032 }, { "epoch": 0.14, "learning_rate": 1.940068519885525e-05, "loss": 1.4448, "step": 5033 }, { "epoch": 0.14, "learning_rate": 1.9400383557867864e-05, "loss": 1.3682, "step": 5034 }, { "epoch": 0.14, "learning_rate": 1.9400081843336298e-05, "loss": 1.4761, "step": 5035 }, { "epoch": 0.14, "learning_rate": 1.9399780055262912e-05, "loss": 1.5774, "step": 5036 }, { "epoch": 0.14, "learning_rate": 1.9399478193650068e-05, "loss": 1.4285, "step": 5037 }, { "epoch": 0.14, "learning_rate": 1.9399176258500127e-05, "loss": 1.3589, "step": 5038 }, { "epoch": 0.14, "learning_rate": 1.9398874249815448e-05, "loss": 1.4592, "step": 5039 }, { "epoch": 0.14, "learning_rate": 1.93985721675984e-05, "loss": 1.301, "step": 5040 }, { "epoch": 0.14, "learning_rate": 1.939827001185134e-05, "loss": 1.406, "step": 5041 }, { "epoch": 0.14, "learning_rate": 1.9397967782576636e-05, "loss": 1.3909, "step": 5042 }, { "epoch": 0.14, "learning_rate": 1.939766547977665e-05, "loss": 1.3333, "step": 5043 }, { "epoch": 0.14, "learning_rate": 1.9397363103453752e-05, "loss": 1.4219, "step": 5044 }, { "epoch": 0.14, "learning_rate": 1.93970606536103e-05, "loss": 1.5269, "step": 5045 }, { "epoch": 0.14, "learning_rate": 1.9396758130248665e-05, "loss": 1.3213, "step": 5046 }, { "epoch": 0.14, "learning_rate": 1.9396455533371216e-05, "loss": 1.4185, "step": 5047 }, { "epoch": 0.14, "learning_rate": 1.9396152862980315e-05, "loss": 1.4028, "step": 5048 }, { "epoch": 0.14, "learning_rate": 1.9395850119078333e-05, "loss": 1.3901, "step": 5049 }, { "epoch": 0.14, "learning_rate": 1.9395547301667636e-05, "loss": 1.5854, "step": 5050 }, { "epoch": 0.14, "learning_rate": 1.9395244410750597e-05, "loss": 1.4614, "step": 5051 }, { "epoch": 0.14, "learning_rate": 1.9394941446329583e-05, "loss": 1.324, "step": 5052 }, { "epoch": 0.14, "learning_rate": 1.9394638408406964e-05, "loss": 1.5017, "step": 5053 }, { "epoch": 0.14, "learning_rate": 1.9394335296985117e-05, "loss": 1.5413, "step": 5054 }, { "epoch": 0.14, "learning_rate": 1.9394032112066405e-05, "loss": 1.447, "step": 5055 }, { "epoch": 0.14, "learning_rate": 1.93937288536532e-05, "loss": 1.5039, "step": 5056 }, { "epoch": 0.14, "learning_rate": 1.939342552174788e-05, "loss": 1.4558, "step": 5057 }, { "epoch": 0.14, "learning_rate": 1.9393122116352816e-05, "loss": 1.3103, "step": 5058 }, { "epoch": 0.14, "learning_rate": 1.939281863747038e-05, "loss": 1.553, "step": 5059 }, { "epoch": 0.14, "learning_rate": 1.939251508510295e-05, "loss": 1.3003, "step": 5060 }, { "epoch": 0.14, "learning_rate": 1.9392211459252896e-05, "loss": 1.4062, "step": 5061 }, { "epoch": 0.14, "learning_rate": 1.93919077599226e-05, "loss": 1.3762, "step": 5062 }, { "epoch": 0.14, "learning_rate": 1.939160398711443e-05, "loss": 1.3855, "step": 5063 }, { "epoch": 0.14, "learning_rate": 1.939130014083077e-05, "loss": 1.5293, "step": 5064 }, { "epoch": 0.14, "learning_rate": 1.9390996221073994e-05, "loss": 1.5449, "step": 5065 }, { "epoch": 0.14, "learning_rate": 1.9390692227846478e-05, "loss": 1.4404, "step": 5066 }, { "epoch": 0.14, "learning_rate": 1.93903881611506e-05, "loss": 1.395, "step": 5067 }, { "epoch": 0.14, "learning_rate": 1.9390084020988743e-05, "loss": 1.55, "step": 5068 }, { "epoch": 0.14, "learning_rate": 1.9389779807363282e-05, "loss": 1.4858, "step": 5069 }, { "epoch": 0.14, "learning_rate": 1.93894755202766e-05, "loss": 1.4631, "step": 5070 }, { "epoch": 0.14, "learning_rate": 1.9389171159731076e-05, "loss": 1.4543, "step": 5071 }, { "epoch": 0.14, "learning_rate": 1.9388866725729095e-05, "loss": 1.7798, "step": 5072 }, { "epoch": 0.14, "learning_rate": 1.9388562218273034e-05, "loss": 1.4521, "step": 5073 }, { "epoch": 0.14, "learning_rate": 1.938825763736528e-05, "loss": 1.425, "step": 5074 }, { "epoch": 0.14, "learning_rate": 1.938795298300821e-05, "loss": 1.3965, "step": 5075 }, { "epoch": 0.14, "learning_rate": 1.938764825520421e-05, "loss": 1.219, "step": 5076 }, { "epoch": 0.14, "learning_rate": 1.9387343453955664e-05, "loss": 1.4668, "step": 5077 }, { "epoch": 0.14, "learning_rate": 1.9387038579264955e-05, "loss": 1.5347, "step": 5078 }, { "epoch": 0.14, "learning_rate": 1.9386733631134477e-05, "loss": 1.2153, "step": 5079 }, { "epoch": 0.14, "learning_rate": 1.9386428609566604e-05, "loss": 1.4126, "step": 5080 }, { "epoch": 0.14, "learning_rate": 1.9386123514563727e-05, "loss": 1.4189, "step": 5081 }, { "epoch": 0.14, "learning_rate": 1.9385818346128236e-05, "loss": 1.4717, "step": 5082 }, { "epoch": 0.14, "learning_rate": 1.9385513104262514e-05, "loss": 1.4758, "step": 5083 }, { "epoch": 0.14, "learning_rate": 1.9385207788968952e-05, "loss": 1.4346, "step": 5084 }, { "epoch": 0.14, "learning_rate": 1.9384902400249936e-05, "loss": 1.4338, "step": 5085 }, { "epoch": 0.14, "learning_rate": 1.9384596938107857e-05, "loss": 1.3555, "step": 5086 }, { "epoch": 0.14, "learning_rate": 1.9384291402545106e-05, "loss": 1.4272, "step": 5087 }, { "epoch": 0.14, "learning_rate": 1.9383985793564072e-05, "loss": 1.7837, "step": 5088 }, { "epoch": 0.14, "learning_rate": 1.9383680111167146e-05, "loss": 1.5754, "step": 5089 }, { "epoch": 0.14, "learning_rate": 1.938337435535672e-05, "loss": 1.3276, "step": 5090 }, { "epoch": 0.14, "learning_rate": 1.938306852613518e-05, "loss": 1.3027, "step": 5091 }, { "epoch": 0.14, "learning_rate": 1.938276262350493e-05, "loss": 1.5229, "step": 5092 }, { "epoch": 0.14, "learning_rate": 1.9382456647468352e-05, "loss": 1.4277, "step": 5093 }, { "epoch": 0.14, "learning_rate": 1.938215059802785e-05, "loss": 1.3181, "step": 5094 }, { "epoch": 0.14, "learning_rate": 1.938184447518581e-05, "loss": 1.417, "step": 5095 }, { "epoch": 0.14, "learning_rate": 1.9381538278944634e-05, "loss": 1.283, "step": 5096 }, { "epoch": 0.14, "learning_rate": 1.938123200930671e-05, "loss": 1.5762, "step": 5097 }, { "epoch": 0.14, "learning_rate": 1.9380925666274444e-05, "loss": 1.4956, "step": 5098 }, { "epoch": 0.14, "learning_rate": 1.938061924985022e-05, "loss": 1.3196, "step": 5099 }, { "epoch": 0.14, "learning_rate": 1.9380312760036447e-05, "loss": 1.3345, "step": 5100 }, { "epoch": 0.14, "learning_rate": 1.9380006196835516e-05, "loss": 1.5435, "step": 5101 }, { "epoch": 0.14, "learning_rate": 1.937969956024983e-05, "loss": 1.4375, "step": 5102 }, { "epoch": 0.14, "learning_rate": 1.937939285028178e-05, "loss": 1.2659, "step": 5103 }, { "epoch": 0.14, "learning_rate": 1.937908606693377e-05, "loss": 1.4775, "step": 5104 }, { "epoch": 0.14, "learning_rate": 1.9378779210208208e-05, "loss": 1.5618, "step": 5105 }, { "epoch": 0.14, "learning_rate": 1.9378472280107485e-05, "loss": 1.4082, "step": 5106 }, { "epoch": 0.14, "learning_rate": 1.9378165276634003e-05, "loss": 1.3323, "step": 5107 }, { "epoch": 0.14, "learning_rate": 1.9377858199790167e-05, "loss": 1.4238, "step": 5108 }, { "epoch": 0.14, "learning_rate": 1.9377551049578378e-05, "loss": 1.3721, "step": 5109 }, { "epoch": 0.14, "learning_rate": 1.937724382600104e-05, "loss": 1.5063, "step": 5110 }, { "epoch": 0.14, "learning_rate": 1.9376936529060556e-05, "loss": 1.2322, "step": 5111 }, { "epoch": 0.14, "learning_rate": 1.9376629158759327e-05, "loss": 1.5049, "step": 5112 }, { "epoch": 0.14, "learning_rate": 1.9376321715099763e-05, "loss": 1.3801, "step": 5113 }, { "epoch": 0.14, "learning_rate": 1.9376014198084266e-05, "loss": 1.5303, "step": 5114 }, { "epoch": 0.14, "learning_rate": 1.9375706607715245e-05, "loss": 1.4546, "step": 5115 }, { "epoch": 0.14, "learning_rate": 1.9375398943995105e-05, "loss": 1.2549, "step": 5116 }, { "epoch": 0.14, "learning_rate": 1.9375091206926248e-05, "loss": 1.3196, "step": 5117 }, { "epoch": 0.14, "learning_rate": 1.9374783396511088e-05, "loss": 1.4199, "step": 5118 }, { "epoch": 0.14, "learning_rate": 1.9374475512752032e-05, "loss": 1.3599, "step": 5119 }, { "epoch": 0.14, "learning_rate": 1.9374167555651487e-05, "loss": 1.4585, "step": 5120 }, { "epoch": 0.14, "learning_rate": 1.937385952521186e-05, "loss": 1.3818, "step": 5121 }, { "epoch": 0.14, "learning_rate": 1.9373551421435567e-05, "loss": 1.4966, "step": 5122 }, { "epoch": 0.14, "learning_rate": 1.9373243244325018e-05, "loss": 1.4739, "step": 5123 }, { "epoch": 0.14, "learning_rate": 1.9372934993882614e-05, "loss": 1.3779, "step": 5124 }, { "epoch": 0.14, "learning_rate": 1.9372626670110783e-05, "loss": 1.4482, "step": 5125 }, { "epoch": 0.14, "learning_rate": 1.9372318273011923e-05, "loss": 1.3801, "step": 5126 }, { "epoch": 0.14, "learning_rate": 1.9372009802588452e-05, "loss": 1.3347, "step": 5127 }, { "epoch": 0.14, "learning_rate": 1.9371701258842785e-05, "loss": 1.3682, "step": 5128 }, { "epoch": 0.14, "learning_rate": 1.9371392641777332e-05, "loss": 1.4287, "step": 5129 }, { "epoch": 0.14, "learning_rate": 1.9371083951394513e-05, "loss": 1.4324, "step": 5130 }, { "epoch": 0.14, "learning_rate": 1.9370775187696737e-05, "loss": 1.459, "step": 5131 }, { "epoch": 0.14, "learning_rate": 1.9370466350686423e-05, "loss": 1.1006, "step": 5132 }, { "epoch": 0.14, "learning_rate": 1.9370157440365987e-05, "loss": 1.3079, "step": 5133 }, { "epoch": 0.14, "learning_rate": 1.9369848456737848e-05, "loss": 1.9175, "step": 5134 }, { "epoch": 0.14, "learning_rate": 1.9369539399804415e-05, "loss": 1.4294, "step": 5135 }, { "epoch": 0.14, "learning_rate": 1.9369230269568116e-05, "loss": 1.3594, "step": 5136 }, { "epoch": 0.14, "learning_rate": 1.9368921066031366e-05, "loss": 1.4556, "step": 5137 }, { "epoch": 0.14, "learning_rate": 1.936861178919658e-05, "loss": 1.2996, "step": 5138 }, { "epoch": 0.14, "learning_rate": 1.9368302439066184e-05, "loss": 1.3994, "step": 5139 }, { "epoch": 0.14, "learning_rate": 1.936799301564259e-05, "loss": 1.4597, "step": 5140 }, { "epoch": 0.14, "learning_rate": 1.9367683518928228e-05, "loss": 1.5454, "step": 5141 }, { "epoch": 0.14, "learning_rate": 1.936737394892551e-05, "loss": 1.5183, "step": 5142 }, { "epoch": 0.14, "learning_rate": 1.9367064305636868e-05, "loss": 1.3062, "step": 5143 }, { "epoch": 0.14, "learning_rate": 1.936675458906472e-05, "loss": 1.3562, "step": 5144 }, { "epoch": 0.14, "learning_rate": 1.9366444799211485e-05, "loss": 1.5203, "step": 5145 }, { "epoch": 0.14, "learning_rate": 1.9366134936079594e-05, "loss": 1.5259, "step": 5146 }, { "epoch": 0.14, "learning_rate": 1.9365824999671465e-05, "loss": 1.4473, "step": 5147 }, { "epoch": 0.14, "learning_rate": 1.9365514989989528e-05, "loss": 1.4438, "step": 5148 }, { "epoch": 0.14, "learning_rate": 1.9365204907036202e-05, "loss": 1.4771, "step": 5149 }, { "epoch": 0.14, "learning_rate": 1.936489475081392e-05, "loss": 1.4092, "step": 5150 }, { "epoch": 0.14, "learning_rate": 1.9364584521325103e-05, "loss": 1.3274, "step": 5151 }, { "epoch": 0.14, "learning_rate": 1.936427421857218e-05, "loss": 1.3188, "step": 5152 }, { "epoch": 0.14, "learning_rate": 1.936396384255758e-05, "loss": 1.2212, "step": 5153 }, { "epoch": 0.14, "learning_rate": 1.936365339328373e-05, "loss": 1.4897, "step": 5154 }, { "epoch": 0.14, "learning_rate": 1.9363342870753058e-05, "loss": 1.8135, "step": 5155 }, { "epoch": 0.14, "learning_rate": 1.9363032274967994e-05, "loss": 1.374, "step": 5156 }, { "epoch": 0.14, "learning_rate": 1.936272160593097e-05, "loss": 1.4763, "step": 5157 }, { "epoch": 0.14, "learning_rate": 1.9362410863644415e-05, "loss": 1.325, "step": 5158 }, { "epoch": 0.14, "learning_rate": 1.936210004811076e-05, "loss": 1.4678, "step": 5159 }, { "epoch": 0.14, "learning_rate": 1.9361789159332435e-05, "loss": 1.3657, "step": 5160 }, { "epoch": 0.14, "learning_rate": 1.9361478197311874e-05, "loss": 1.7803, "step": 5161 }, { "epoch": 0.14, "learning_rate": 1.936116716205151e-05, "loss": 1.4741, "step": 5162 }, { "epoch": 0.14, "learning_rate": 1.936085605355378e-05, "loss": 1.3684, "step": 5163 }, { "epoch": 0.14, "learning_rate": 1.9360544871821108e-05, "loss": 1.2585, "step": 5164 }, { "epoch": 0.14, "learning_rate": 1.9360233616855937e-05, "loss": 1.5632, "step": 5165 }, { "epoch": 0.14, "learning_rate": 1.93599222886607e-05, "loss": 1.2795, "step": 5166 }, { "epoch": 0.14, "learning_rate": 1.935961088723783e-05, "loss": 1.2925, "step": 5167 }, { "epoch": 0.14, "learning_rate": 1.935929941258977e-05, "loss": 1.5737, "step": 5168 }, { "epoch": 0.14, "learning_rate": 1.9358987864718948e-05, "loss": 1.5542, "step": 5169 }, { "epoch": 0.14, "learning_rate": 1.9358676243627807e-05, "loss": 1.3726, "step": 5170 }, { "epoch": 0.14, "learning_rate": 1.9358364549318785e-05, "loss": 1.4045, "step": 5171 }, { "epoch": 0.14, "learning_rate": 1.935805278179432e-05, "loss": 1.3276, "step": 5172 }, { "epoch": 0.14, "learning_rate": 1.935774094105685e-05, "loss": 1.322, "step": 5173 }, { "epoch": 0.14, "learning_rate": 1.9357429027108813e-05, "loss": 1.4399, "step": 5174 }, { "epoch": 0.14, "learning_rate": 1.9357117039952655e-05, "loss": 1.3479, "step": 5175 }, { "epoch": 0.14, "learning_rate": 1.935680497959081e-05, "loss": 1.364, "step": 5176 }, { "epoch": 0.14, "learning_rate": 1.9356492846025725e-05, "loss": 1.4709, "step": 5177 }, { "epoch": 0.14, "learning_rate": 1.935618063925984e-05, "loss": 1.4736, "step": 5178 }, { "epoch": 0.14, "learning_rate": 1.9355868359295596e-05, "loss": 1.4456, "step": 5179 }, { "epoch": 0.14, "learning_rate": 1.9355556006135437e-05, "loss": 1.4492, "step": 5180 }, { "epoch": 0.14, "learning_rate": 1.9355243579781806e-05, "loss": 1.4512, "step": 5181 }, { "epoch": 0.14, "learning_rate": 1.9354931080237152e-05, "loss": 1.2644, "step": 5182 }, { "epoch": 0.14, "learning_rate": 1.9354618507503912e-05, "loss": 1.3928, "step": 5183 }, { "epoch": 0.14, "learning_rate": 1.9354305861584542e-05, "loss": 1.3381, "step": 5184 }, { "epoch": 0.14, "learning_rate": 1.9353993142481474e-05, "loss": 1.4287, "step": 5185 }, { "epoch": 0.14, "learning_rate": 1.9353680350197166e-05, "loss": 1.8306, "step": 5186 }, { "epoch": 0.14, "learning_rate": 1.9353367484734062e-05, "loss": 1.3333, "step": 5187 }, { "epoch": 0.14, "learning_rate": 1.935305454609461e-05, "loss": 1.3999, "step": 5188 }, { "epoch": 0.14, "learning_rate": 1.9352741534281255e-05, "loss": 1.4258, "step": 5189 }, { "epoch": 0.14, "learning_rate": 1.9352428449296448e-05, "loss": 1.5166, "step": 5190 }, { "epoch": 0.14, "learning_rate": 1.935211529114264e-05, "loss": 1.2832, "step": 5191 }, { "epoch": 0.14, "learning_rate": 1.9351802059822277e-05, "loss": 1.2842, "step": 5192 }, { "epoch": 0.14, "learning_rate": 1.9351488755337815e-05, "loss": 1.2407, "step": 5193 }, { "epoch": 0.14, "learning_rate": 1.9351175377691703e-05, "loss": 1.3157, "step": 5194 }, { "epoch": 0.14, "learning_rate": 1.935086192688639e-05, "loss": 1.4717, "step": 5195 }, { "epoch": 0.14, "learning_rate": 1.9350548402924332e-05, "loss": 1.3987, "step": 5196 }, { "epoch": 0.14, "learning_rate": 1.935023480580798e-05, "loss": 1.5874, "step": 5197 }, { "epoch": 0.14, "learning_rate": 1.9349921135539786e-05, "loss": 1.2808, "step": 5198 }, { "epoch": 0.14, "learning_rate": 1.9349607392122208e-05, "loss": 1.1873, "step": 5199 }, { "epoch": 0.14, "learning_rate": 1.9349293575557694e-05, "loss": 1.4219, "step": 5200 }, { "epoch": 0.14, "learning_rate": 1.9348979685848706e-05, "loss": 1.5649, "step": 5201 }, { "epoch": 0.14, "learning_rate": 1.93486657229977e-05, "loss": 1.4248, "step": 5202 }, { "epoch": 0.14, "learning_rate": 1.9348351687007124e-05, "loss": 1.4719, "step": 5203 }, { "epoch": 0.14, "learning_rate": 1.9348037577879446e-05, "loss": 1.76, "step": 5204 }, { "epoch": 0.14, "learning_rate": 1.9347723395617117e-05, "loss": 1.3442, "step": 5205 }, { "epoch": 0.14, "learning_rate": 1.934740914022259e-05, "loss": 1.4397, "step": 5206 }, { "epoch": 0.14, "learning_rate": 1.934709481169833e-05, "loss": 1.5034, "step": 5207 }, { "epoch": 0.14, "learning_rate": 1.93467804100468e-05, "loss": 1.3152, "step": 5208 }, { "epoch": 0.14, "learning_rate": 1.9346465935270456e-05, "loss": 1.5127, "step": 5209 }, { "epoch": 0.14, "learning_rate": 1.9346151387371755e-05, "loss": 1.4414, "step": 5210 }, { "epoch": 0.14, "learning_rate": 1.934583676635316e-05, "loss": 1.3733, "step": 5211 }, { "epoch": 0.14, "learning_rate": 1.9345522072217134e-05, "loss": 1.4067, "step": 5212 }, { "epoch": 0.14, "learning_rate": 1.9345207304966137e-05, "loss": 1.406, "step": 5213 }, { "epoch": 0.14, "learning_rate": 1.9344892464602633e-05, "loss": 1.4453, "step": 5214 }, { "epoch": 0.14, "learning_rate": 1.9344577551129083e-05, "loss": 1.446, "step": 5215 }, { "epoch": 0.14, "learning_rate": 1.9344262564547954e-05, "loss": 1.4248, "step": 5216 }, { "epoch": 0.14, "learning_rate": 1.934394750486171e-05, "loss": 1.3748, "step": 5217 }, { "epoch": 0.14, "learning_rate": 1.9343632372072815e-05, "loss": 1.342, "step": 5218 }, { "epoch": 0.14, "learning_rate": 1.934331716618373e-05, "loss": 1.4707, "step": 5219 }, { "epoch": 0.14, "learning_rate": 1.934300188719693e-05, "loss": 1.4963, "step": 5220 }, { "epoch": 0.14, "learning_rate": 1.9342686535114872e-05, "loss": 1.4231, "step": 5221 }, { "epoch": 0.14, "learning_rate": 1.9342371109940032e-05, "loss": 1.4429, "step": 5222 }, { "epoch": 0.14, "learning_rate": 1.9342055611674867e-05, "loss": 1.8315, "step": 5223 }, { "epoch": 0.14, "learning_rate": 1.934174004032186e-05, "loss": 1.541, "step": 5224 }, { "epoch": 0.14, "learning_rate": 1.9341424395883467e-05, "loss": 1.2825, "step": 5225 }, { "epoch": 0.14, "learning_rate": 1.934110867836216e-05, "loss": 1.394, "step": 5226 }, { "epoch": 0.14, "learning_rate": 1.9340792887760417e-05, "loss": 1.3457, "step": 5227 }, { "epoch": 0.14, "learning_rate": 1.93404770240807e-05, "loss": 1.4639, "step": 5228 }, { "epoch": 0.14, "learning_rate": 1.9340161087325483e-05, "loss": 1.405, "step": 5229 }, { "epoch": 0.14, "learning_rate": 1.9339845077497237e-05, "loss": 1.4736, "step": 5230 }, { "epoch": 0.14, "learning_rate": 1.9339528994598433e-05, "loss": 1.2115, "step": 5231 }, { "epoch": 0.14, "learning_rate": 1.933921283863155e-05, "loss": 1.5583, "step": 5232 }, { "epoch": 0.14, "learning_rate": 1.9338896609599056e-05, "loss": 1.4697, "step": 5233 }, { "epoch": 0.14, "learning_rate": 1.9338580307503426e-05, "loss": 1.4404, "step": 5234 }, { "epoch": 0.14, "learning_rate": 1.9338263932347135e-05, "loss": 1.2368, "step": 5235 }, { "epoch": 0.14, "learning_rate": 1.933794748413266e-05, "loss": 1.5127, "step": 5236 }, { "epoch": 0.14, "learning_rate": 1.933763096286247e-05, "loss": 1.4399, "step": 5237 }, { "epoch": 0.14, "learning_rate": 1.9337314368539052e-05, "loss": 1.3093, "step": 5238 }, { "epoch": 0.14, "learning_rate": 1.9336997701164875e-05, "loss": 1.3999, "step": 5239 }, { "epoch": 0.14, "learning_rate": 1.9336680960742417e-05, "loss": 1.3508, "step": 5240 }, { "epoch": 0.14, "learning_rate": 1.933636414727416e-05, "loss": 1.2639, "step": 5241 }, { "epoch": 0.14, "learning_rate": 1.9336047260762577e-05, "loss": 1.3784, "step": 5242 }, { "epoch": 0.14, "learning_rate": 1.933573030121015e-05, "loss": 1.5771, "step": 5243 }, { "epoch": 0.14, "learning_rate": 1.9335413268619362e-05, "loss": 1.4175, "step": 5244 }, { "epoch": 0.14, "learning_rate": 1.933509616299269e-05, "loss": 1.5208, "step": 5245 }, { "epoch": 0.14, "learning_rate": 1.9334778984332617e-05, "loss": 1.4941, "step": 5246 }, { "epoch": 0.14, "learning_rate": 1.933446173264162e-05, "loss": 1.427, "step": 5247 }, { "epoch": 0.14, "learning_rate": 1.9334144407922182e-05, "loss": 1.1792, "step": 5248 }, { "epoch": 0.14, "learning_rate": 1.9333827010176794e-05, "loss": 1.416, "step": 5249 }, { "epoch": 0.14, "learning_rate": 1.9333509539407926e-05, "loss": 1.4722, "step": 5250 }, { "epoch": 0.14, "learning_rate": 1.9333191995618073e-05, "loss": 1.3931, "step": 5251 }, { "epoch": 0.14, "learning_rate": 1.933287437880971e-05, "loss": 1.7959, "step": 5252 }, { "epoch": 0.14, "learning_rate": 1.9332556688985332e-05, "loss": 1.4382, "step": 5253 }, { "epoch": 0.14, "learning_rate": 1.9332238926147412e-05, "loss": 1.4749, "step": 5254 }, { "epoch": 0.14, "learning_rate": 1.933192109029845e-05, "loss": 1.4399, "step": 5255 }, { "epoch": 0.14, "learning_rate": 1.933160318144092e-05, "loss": 1.2192, "step": 5256 }, { "epoch": 0.14, "learning_rate": 1.9331285199577318e-05, "loss": 1.3867, "step": 5257 }, { "epoch": 0.14, "learning_rate": 1.9330967144710126e-05, "loss": 1.6611, "step": 5258 }, { "epoch": 0.14, "learning_rate": 1.933064901684184e-05, "loss": 1.4897, "step": 5259 }, { "epoch": 0.14, "learning_rate": 1.9330330815974938e-05, "loss": 1.4941, "step": 5260 }, { "epoch": 0.14, "learning_rate": 1.9330012542111917e-05, "loss": 1.481, "step": 5261 }, { "epoch": 0.14, "learning_rate": 1.9329694195255263e-05, "loss": 1.5972, "step": 5262 }, { "epoch": 0.14, "learning_rate": 1.9329375775407472e-05, "loss": 1.4526, "step": 5263 }, { "epoch": 0.14, "learning_rate": 1.932905728257103e-05, "loss": 1.4922, "step": 5264 }, { "epoch": 0.14, "learning_rate": 1.9328738716748435e-05, "loss": 1.4207, "step": 5265 }, { "epoch": 0.14, "learning_rate": 1.932842007794217e-05, "loss": 1.3938, "step": 5266 }, { "epoch": 0.14, "learning_rate": 1.9328101366154733e-05, "loss": 1.3203, "step": 5267 }, { "epoch": 0.14, "learning_rate": 1.9327782581388618e-05, "loss": 1.2493, "step": 5268 }, { "epoch": 0.14, "learning_rate": 1.932746372364632e-05, "loss": 1.322, "step": 5269 }, { "epoch": 0.14, "learning_rate": 1.932714479293033e-05, "loss": 1.3269, "step": 5270 }, { "epoch": 0.14, "learning_rate": 1.932682578924315e-05, "loss": 1.4978, "step": 5271 }, { "epoch": 0.14, "learning_rate": 1.9326506712587265e-05, "loss": 1.459, "step": 5272 }, { "epoch": 0.14, "learning_rate": 1.9326187562965177e-05, "loss": 1.3911, "step": 5273 }, { "epoch": 0.14, "learning_rate": 1.9325868340379387e-05, "loss": 1.4326, "step": 5274 }, { "epoch": 0.14, "learning_rate": 1.9325549044832387e-05, "loss": 1.2253, "step": 5275 }, { "epoch": 0.14, "learning_rate": 1.9325229676326676e-05, "loss": 1.4021, "step": 5276 }, { "epoch": 0.14, "learning_rate": 1.9324910234864753e-05, "loss": 1.4231, "step": 5277 }, { "epoch": 0.14, "learning_rate": 1.9324590720449115e-05, "loss": 1.4343, "step": 5278 }, { "epoch": 0.14, "learning_rate": 1.9324271133082267e-05, "loss": 1.6494, "step": 5279 }, { "epoch": 0.14, "learning_rate": 1.9323951472766706e-05, "loss": 1.3977, "step": 5280 }, { "epoch": 0.14, "learning_rate": 1.932363173950493e-05, "loss": 1.4832, "step": 5281 }, { "epoch": 0.14, "learning_rate": 1.9323311933299447e-05, "loss": 1.5352, "step": 5282 }, { "epoch": 0.14, "learning_rate": 1.9322992054152754e-05, "loss": 1.4468, "step": 5283 }, { "epoch": 0.14, "learning_rate": 1.9322672102067356e-05, "loss": 1.3857, "step": 5284 }, { "epoch": 0.14, "learning_rate": 1.9322352077045753e-05, "loss": 1.3916, "step": 5285 }, { "epoch": 0.14, "learning_rate": 1.9322031979090453e-05, "loss": 1.4138, "step": 5286 }, { "epoch": 0.14, "learning_rate": 1.932171180820396e-05, "loss": 1.4346, "step": 5287 }, { "epoch": 0.14, "learning_rate": 1.9321391564388773e-05, "loss": 1.2568, "step": 5288 }, { "epoch": 0.14, "learning_rate": 1.9321071247647407e-05, "loss": 1.5601, "step": 5289 }, { "epoch": 0.14, "learning_rate": 1.932075085798236e-05, "loss": 1.3887, "step": 5290 }, { "epoch": 0.14, "learning_rate": 1.932043039539614e-05, "loss": 1.2825, "step": 5291 }, { "epoch": 0.14, "learning_rate": 1.9320109859891256e-05, "loss": 1.502, "step": 5292 }, { "epoch": 0.14, "learning_rate": 1.9319789251470212e-05, "loss": 1.2942, "step": 5293 }, { "epoch": 0.14, "learning_rate": 1.9319468570135528e-05, "loss": 1.4453, "step": 5294 }, { "epoch": 0.14, "learning_rate": 1.9319147815889695e-05, "loss": 1.5103, "step": 5295 }, { "epoch": 0.14, "learning_rate": 1.9318826988735237e-05, "loss": 1.4268, "step": 5296 }, { "epoch": 0.14, "learning_rate": 1.9318506088674657e-05, "loss": 1.3989, "step": 5297 }, { "epoch": 0.14, "learning_rate": 1.9318185115710467e-05, "loss": 1.3425, "step": 5298 }, { "epoch": 0.14, "learning_rate": 1.931786406984518e-05, "loss": 1.4287, "step": 5299 }, { "epoch": 0.14, "learning_rate": 1.9317542951081306e-05, "loss": 1.5796, "step": 5300 }, { "epoch": 0.14, "learning_rate": 1.9317221759421354e-05, "loss": 1.2738, "step": 5301 }, { "epoch": 0.14, "learning_rate": 1.9316900494867844e-05, "loss": 1.3147, "step": 5302 }, { "epoch": 0.14, "learning_rate": 1.9316579157423282e-05, "loss": 1.4221, "step": 5303 }, { "epoch": 0.14, "learning_rate": 1.9316257747090187e-05, "loss": 1.5537, "step": 5304 }, { "epoch": 0.14, "learning_rate": 1.9315936263871076e-05, "loss": 1.4146, "step": 5305 }, { "epoch": 0.14, "learning_rate": 1.9315614707768456e-05, "loss": 1.3479, "step": 5306 }, { "epoch": 0.14, "learning_rate": 1.931529307878485e-05, "loss": 1.4453, "step": 5307 }, { "epoch": 0.14, "learning_rate": 1.9314971376922768e-05, "loss": 1.3899, "step": 5308 }, { "epoch": 0.14, "learning_rate": 1.9314649602184735e-05, "loss": 1.3086, "step": 5309 }, { "epoch": 0.15, "learning_rate": 1.9314327754573256e-05, "loss": 1.4622, "step": 5310 }, { "epoch": 0.15, "learning_rate": 1.9314005834090862e-05, "loss": 1.4385, "step": 5311 }, { "epoch": 0.15, "learning_rate": 1.9313683840740066e-05, "loss": 1.4067, "step": 5312 }, { "epoch": 0.15, "learning_rate": 1.9313361774523387e-05, "loss": 1.3367, "step": 5313 }, { "epoch": 0.15, "learning_rate": 1.9313039635443344e-05, "loss": 1.4854, "step": 5314 }, { "epoch": 0.15, "learning_rate": 1.9312717423502456e-05, "loss": 1.3604, "step": 5315 }, { "epoch": 0.15, "learning_rate": 1.931239513870325e-05, "loss": 1.3206, "step": 5316 }, { "epoch": 0.15, "learning_rate": 1.9312072781048245e-05, "loss": 1.2908, "step": 5317 }, { "epoch": 0.15, "learning_rate": 1.9311750350539954e-05, "loss": 1.5, "step": 5318 }, { "epoch": 0.15, "learning_rate": 1.9311427847180914e-05, "loss": 1.4075, "step": 5319 }, { "epoch": 0.15, "learning_rate": 1.9311105270973635e-05, "loss": 1.426, "step": 5320 }, { "epoch": 0.15, "learning_rate": 1.9310782621920652e-05, "loss": 1.4199, "step": 5321 }, { "epoch": 0.15, "learning_rate": 1.9310459900024482e-05, "loss": 1.2861, "step": 5322 }, { "epoch": 0.15, "learning_rate": 1.9310137105287653e-05, "loss": 1.4705, "step": 5323 }, { "epoch": 0.15, "learning_rate": 1.9309814237712686e-05, "loss": 1.5386, "step": 5324 }, { "epoch": 0.15, "learning_rate": 1.930949129730211e-05, "loss": 1.4653, "step": 5325 }, { "epoch": 0.15, "learning_rate": 1.9309168284058456e-05, "loss": 1.4155, "step": 5326 }, { "epoch": 0.15, "learning_rate": 1.9308845197984245e-05, "loss": 1.542, "step": 5327 }, { "epoch": 0.15, "learning_rate": 1.930852203908201e-05, "loss": 1.3896, "step": 5328 }, { "epoch": 0.15, "learning_rate": 1.930819880735427e-05, "loss": 1.4202, "step": 5329 }, { "epoch": 0.15, "learning_rate": 1.9307875502803562e-05, "loss": 1.4424, "step": 5330 }, { "epoch": 0.15, "learning_rate": 1.9307552125432413e-05, "loss": 1.3713, "step": 5331 }, { "epoch": 0.15, "learning_rate": 1.930722867524335e-05, "loss": 1.481, "step": 5332 }, { "epoch": 0.15, "learning_rate": 1.9306905152238912e-05, "loss": 1.4141, "step": 5333 }, { "epoch": 0.15, "learning_rate": 1.930658155642162e-05, "loss": 1.561, "step": 5334 }, { "epoch": 0.15, "learning_rate": 1.930625788779401e-05, "loss": 1.3943, "step": 5335 }, { "epoch": 0.15, "learning_rate": 1.9305934146358617e-05, "loss": 1.3062, "step": 5336 }, { "epoch": 0.15, "learning_rate": 1.930561033211797e-05, "loss": 1.3745, "step": 5337 }, { "epoch": 0.15, "learning_rate": 1.9305286445074602e-05, "loss": 1.7793, "step": 5338 }, { "epoch": 0.15, "learning_rate": 1.9304962485231052e-05, "loss": 1.4299, "step": 5339 }, { "epoch": 0.15, "learning_rate": 1.9304638452589848e-05, "loss": 1.49, "step": 5340 }, { "epoch": 0.15, "learning_rate": 1.930431434715353e-05, "loss": 1.5142, "step": 5341 }, { "epoch": 0.15, "learning_rate": 1.930399016892463e-05, "loss": 1.502, "step": 5342 }, { "epoch": 0.15, "learning_rate": 1.930366591790569e-05, "loss": 1.396, "step": 5343 }, { "epoch": 0.15, "learning_rate": 1.9303341594099237e-05, "loss": 1.4463, "step": 5344 }, { "epoch": 0.15, "learning_rate": 1.930301719750782e-05, "loss": 1.3975, "step": 5345 }, { "epoch": 0.15, "learning_rate": 1.9302692728133966e-05, "loss": 1.5078, "step": 5346 }, { "epoch": 0.15, "learning_rate": 1.9302368185980218e-05, "loss": 1.3047, "step": 5347 }, { "epoch": 0.15, "learning_rate": 1.930204357104912e-05, "loss": 1.4192, "step": 5348 }, { "epoch": 0.15, "learning_rate": 1.9301718883343204e-05, "loss": 1.4082, "step": 5349 }, { "epoch": 0.15, "learning_rate": 1.9301394122865017e-05, "loss": 1.3223, "step": 5350 }, { "epoch": 0.15, "learning_rate": 1.930106928961709e-05, "loss": 1.2661, "step": 5351 }, { "epoch": 0.15, "learning_rate": 1.9300744383601974e-05, "loss": 1.3267, "step": 5352 }, { "epoch": 0.15, "learning_rate": 1.930041940482221e-05, "loss": 1.2876, "step": 5353 }, { "epoch": 0.15, "learning_rate": 1.9300094353280338e-05, "loss": 1.2642, "step": 5354 }, { "epoch": 0.15, "learning_rate": 1.9299769228978897e-05, "loss": 1.5449, "step": 5355 }, { "epoch": 0.15, "learning_rate": 1.9299444031920437e-05, "loss": 1.3806, "step": 5356 }, { "epoch": 0.15, "learning_rate": 1.92991187621075e-05, "loss": 1.4236, "step": 5357 }, { "epoch": 0.15, "learning_rate": 1.929879341954263e-05, "loss": 1.3403, "step": 5358 }, { "epoch": 0.15, "learning_rate": 1.929846800422837e-05, "loss": 1.438, "step": 5359 }, { "epoch": 0.15, "learning_rate": 1.929814251616727e-05, "loss": 1.4216, "step": 5360 }, { "epoch": 0.15, "learning_rate": 1.929781695536188e-05, "loss": 1.4019, "step": 5361 }, { "epoch": 0.15, "learning_rate": 1.9297491321814737e-05, "loss": 1.4104, "step": 5362 }, { "epoch": 0.15, "learning_rate": 1.9297165615528397e-05, "loss": 1.5015, "step": 5363 }, { "epoch": 0.15, "learning_rate": 1.9296839836505403e-05, "loss": 1.4155, "step": 5364 }, { "epoch": 0.15, "learning_rate": 1.929651398474831e-05, "loss": 1.3301, "step": 5365 }, { "epoch": 0.15, "learning_rate": 1.9296188060259656e-05, "loss": 1.387, "step": 5366 }, { "epoch": 0.15, "learning_rate": 1.9295862063042005e-05, "loss": 1.4963, "step": 5367 }, { "epoch": 0.15, "learning_rate": 1.9295535993097895e-05, "loss": 1.3574, "step": 5368 }, { "epoch": 0.15, "learning_rate": 1.9295209850429884e-05, "loss": 1.4941, "step": 5369 }, { "epoch": 0.15, "learning_rate": 1.9294883635040523e-05, "loss": 1.5103, "step": 5370 }, { "epoch": 0.15, "learning_rate": 1.9294557346932365e-05, "loss": 1.5481, "step": 5371 }, { "epoch": 0.15, "learning_rate": 1.929423098610796e-05, "loss": 1.4556, "step": 5372 }, { "epoch": 0.15, "learning_rate": 1.9293904552569857e-05, "loss": 1.3699, "step": 5373 }, { "epoch": 0.15, "learning_rate": 1.929357804632062e-05, "loss": 1.2588, "step": 5374 }, { "epoch": 0.15, "learning_rate": 1.92932514673628e-05, "loss": 1.4434, "step": 5375 }, { "epoch": 0.15, "learning_rate": 1.9292924815698947e-05, "loss": 1.3079, "step": 5376 }, { "epoch": 0.15, "learning_rate": 1.929259809133162e-05, "loss": 1.4277, "step": 5377 }, { "epoch": 0.15, "learning_rate": 1.929227129426338e-05, "loss": 1.438, "step": 5378 }, { "epoch": 0.15, "learning_rate": 1.9291944424496773e-05, "loss": 1.6572, "step": 5379 }, { "epoch": 0.15, "learning_rate": 1.9291617482034365e-05, "loss": 1.541, "step": 5380 }, { "epoch": 0.15, "learning_rate": 1.929129046687871e-05, "loss": 1.3979, "step": 5381 }, { "epoch": 0.15, "learning_rate": 1.929096337903237e-05, "loss": 1.345, "step": 5382 }, { "epoch": 0.15, "learning_rate": 1.9290636218497898e-05, "loss": 1.7834, "step": 5383 }, { "epoch": 0.15, "learning_rate": 1.9290308985277858e-05, "loss": 1.3013, "step": 5384 }, { "epoch": 0.15, "learning_rate": 1.9289981679374808e-05, "loss": 1.4104, "step": 5385 }, { "epoch": 0.15, "learning_rate": 1.9289654300791313e-05, "loss": 1.2959, "step": 5386 }, { "epoch": 0.15, "learning_rate": 1.928932684952993e-05, "loss": 1.4351, "step": 5387 }, { "epoch": 0.15, "learning_rate": 1.9288999325593222e-05, "loss": 1.3782, "step": 5388 }, { "epoch": 0.15, "learning_rate": 1.9288671728983752e-05, "loss": 1.3691, "step": 5389 }, { "epoch": 0.15, "learning_rate": 1.928834405970408e-05, "loss": 1.4116, "step": 5390 }, { "epoch": 0.15, "learning_rate": 1.9288016317756773e-05, "loss": 1.3247, "step": 5391 }, { "epoch": 0.15, "learning_rate": 1.9287688503144393e-05, "loss": 1.4731, "step": 5392 }, { "epoch": 0.15, "learning_rate": 1.9287360615869506e-05, "loss": 1.3223, "step": 5393 }, { "epoch": 0.15, "learning_rate": 1.9287032655934675e-05, "loss": 1.4707, "step": 5394 }, { "epoch": 0.15, "learning_rate": 1.9286704623342473e-05, "loss": 1.3127, "step": 5395 }, { "epoch": 0.15, "learning_rate": 1.9286376518095454e-05, "loss": 1.4031, "step": 5396 }, { "epoch": 0.15, "learning_rate": 1.9286048340196197e-05, "loss": 1.4565, "step": 5397 }, { "epoch": 0.15, "learning_rate": 1.9285720089647262e-05, "loss": 1.207, "step": 5398 }, { "epoch": 0.15, "learning_rate": 1.928539176645122e-05, "loss": 1.5034, "step": 5399 }, { "epoch": 0.15, "learning_rate": 1.9285063370610638e-05, "loss": 1.5874, "step": 5400 }, { "epoch": 0.15, "learning_rate": 1.928473490212809e-05, "loss": 1.4397, "step": 5401 }, { "epoch": 0.15, "learning_rate": 1.9284406361006138e-05, "loss": 1.3884, "step": 5402 }, { "epoch": 0.15, "learning_rate": 1.928407774724736e-05, "loss": 1.302, "step": 5403 }, { "epoch": 0.15, "learning_rate": 1.928374906085432e-05, "loss": 1.5195, "step": 5404 }, { "epoch": 0.15, "learning_rate": 1.9283420301829597e-05, "loss": 1.5552, "step": 5405 }, { "epoch": 0.15, "learning_rate": 1.9283091470175755e-05, "loss": 1.4292, "step": 5406 }, { "epoch": 0.15, "learning_rate": 1.928276256589537e-05, "loss": 1.2983, "step": 5407 }, { "epoch": 0.15, "learning_rate": 1.9282433588991018e-05, "loss": 1.354, "step": 5408 }, { "epoch": 0.15, "learning_rate": 1.9282104539465273e-05, "loss": 1.3652, "step": 5409 }, { "epoch": 0.15, "learning_rate": 1.9281775417320703e-05, "loss": 1.3542, "step": 5410 }, { "epoch": 0.15, "learning_rate": 1.9281446222559886e-05, "loss": 1.29, "step": 5411 }, { "epoch": 0.15, "learning_rate": 1.92811169551854e-05, "loss": 1.4377, "step": 5412 }, { "epoch": 0.15, "learning_rate": 1.928078761519982e-05, "loss": 1.3894, "step": 5413 }, { "epoch": 0.15, "learning_rate": 1.9280458202605722e-05, "loss": 1.3872, "step": 5414 }, { "epoch": 0.15, "learning_rate": 1.9280128717405683e-05, "loss": 1.5518, "step": 5415 }, { "epoch": 0.15, "learning_rate": 1.9279799159602276e-05, "loss": 1.5342, "step": 5416 }, { "epoch": 0.15, "learning_rate": 1.927946952919809e-05, "loss": 1.4707, "step": 5417 }, { "epoch": 0.15, "learning_rate": 1.9279139826195696e-05, "loss": 1.478, "step": 5418 }, { "epoch": 0.15, "learning_rate": 1.9278810050597672e-05, "loss": 1.4888, "step": 5419 }, { "epoch": 0.15, "learning_rate": 1.9278480202406607e-05, "loss": 1.3794, "step": 5420 }, { "epoch": 0.15, "learning_rate": 1.9278150281625073e-05, "loss": 1.4141, "step": 5421 }, { "epoch": 0.15, "learning_rate": 1.9277820288255654e-05, "loss": 1.5449, "step": 5422 }, { "epoch": 0.15, "learning_rate": 1.9277490222300933e-05, "loss": 1.416, "step": 5423 }, { "epoch": 0.15, "learning_rate": 1.9277160083763488e-05, "loss": 1.4143, "step": 5424 }, { "epoch": 0.15, "learning_rate": 1.9276829872645906e-05, "loss": 1.3032, "step": 5425 }, { "epoch": 0.15, "learning_rate": 1.9276499588950775e-05, "loss": 1.3381, "step": 5426 }, { "epoch": 0.15, "learning_rate": 1.9276169232680668e-05, "loss": 1.46, "step": 5427 }, { "epoch": 0.15, "learning_rate": 1.9275838803838173e-05, "loss": 1.3047, "step": 5428 }, { "epoch": 0.15, "learning_rate": 1.9275508302425884e-05, "loss": 1.4771, "step": 5429 }, { "epoch": 0.15, "learning_rate": 1.927517772844637e-05, "loss": 1.3103, "step": 5430 }, { "epoch": 0.15, "learning_rate": 1.9274847081902237e-05, "loss": 1.5063, "step": 5431 }, { "epoch": 0.15, "learning_rate": 1.9274516362796057e-05, "loss": 1.3948, "step": 5432 }, { "epoch": 0.15, "learning_rate": 1.927418557113042e-05, "loss": 1.4893, "step": 5433 }, { "epoch": 0.15, "learning_rate": 1.927385470690792e-05, "loss": 1.5168, "step": 5434 }, { "epoch": 0.15, "learning_rate": 1.9273523770131142e-05, "loss": 1.4819, "step": 5435 }, { "epoch": 0.15, "learning_rate": 1.927319276080267e-05, "loss": 1.4221, "step": 5436 }, { "epoch": 0.15, "learning_rate": 1.9272861678925103e-05, "loss": 1.3936, "step": 5437 }, { "epoch": 0.15, "learning_rate": 1.9272530524501027e-05, "loss": 1.2207, "step": 5438 }, { "epoch": 0.15, "learning_rate": 1.9272199297533027e-05, "loss": 1.3228, "step": 5439 }, { "epoch": 0.15, "learning_rate": 1.9271867998023703e-05, "loss": 1.3647, "step": 5440 }, { "epoch": 0.15, "learning_rate": 1.9271536625975646e-05, "loss": 1.3855, "step": 5441 }, { "epoch": 0.15, "learning_rate": 1.927120518139144e-05, "loss": 1.4011, "step": 5442 }, { "epoch": 0.15, "learning_rate": 1.927087366427369e-05, "loss": 1.3933, "step": 5443 }, { "epoch": 0.15, "learning_rate": 1.927054207462498e-05, "loss": 1.4363, "step": 5444 }, { "epoch": 0.15, "learning_rate": 1.9270210412447913e-05, "loss": 1.4268, "step": 5445 }, { "epoch": 0.15, "learning_rate": 1.9269878677745074e-05, "loss": 1.5144, "step": 5446 }, { "epoch": 0.15, "learning_rate": 1.926954687051907e-05, "loss": 1.2576, "step": 5447 }, { "epoch": 0.15, "learning_rate": 1.9269214990772484e-05, "loss": 1.4338, "step": 5448 }, { "epoch": 0.15, "learning_rate": 1.926888303850792e-05, "loss": 1.4392, "step": 5449 }, { "epoch": 0.15, "learning_rate": 1.9268551013727975e-05, "loss": 1.4031, "step": 5450 }, { "epoch": 0.15, "learning_rate": 1.9268218916435245e-05, "loss": 1.3462, "step": 5451 }, { "epoch": 0.15, "learning_rate": 1.9267886746632327e-05, "loss": 1.3235, "step": 5452 }, { "epoch": 0.15, "learning_rate": 1.926755450432182e-05, "loss": 1.3325, "step": 5453 }, { "epoch": 0.15, "learning_rate": 1.9267222189506327e-05, "loss": 1.4568, "step": 5454 }, { "epoch": 0.15, "learning_rate": 1.9266889802188445e-05, "loss": 1.4856, "step": 5455 }, { "epoch": 0.15, "learning_rate": 1.9266557342370773e-05, "loss": 1.4014, "step": 5456 }, { "epoch": 0.15, "learning_rate": 1.9266224810055915e-05, "loss": 1.543, "step": 5457 }, { "epoch": 0.15, "learning_rate": 1.9265892205246474e-05, "loss": 1.5415, "step": 5458 }, { "epoch": 0.15, "learning_rate": 1.9265559527945047e-05, "loss": 1.4446, "step": 5459 }, { "epoch": 0.15, "learning_rate": 1.9265226778154238e-05, "loss": 1.4639, "step": 5460 }, { "epoch": 0.15, "learning_rate": 1.926489395587665e-05, "loss": 1.2717, "step": 5461 }, { "epoch": 0.15, "learning_rate": 1.9264561061114896e-05, "loss": 1.4307, "step": 5462 }, { "epoch": 0.15, "learning_rate": 1.9264228093871567e-05, "loss": 1.4294, "step": 5463 }, { "epoch": 0.15, "learning_rate": 1.9263895054149275e-05, "loss": 1.519, "step": 5464 }, { "epoch": 0.15, "learning_rate": 1.9263561941950622e-05, "loss": 1.5356, "step": 5465 }, { "epoch": 0.15, "learning_rate": 1.9263228757278218e-05, "loss": 1.3884, "step": 5466 }, { "epoch": 0.15, "learning_rate": 1.9262895500134667e-05, "loss": 1.3635, "step": 5467 }, { "epoch": 0.15, "learning_rate": 1.926256217052258e-05, "loss": 1.5205, "step": 5468 }, { "epoch": 0.15, "learning_rate": 1.926222876844456e-05, "loss": 1.3896, "step": 5469 }, { "epoch": 0.15, "learning_rate": 1.926189529390322e-05, "loss": 1.4473, "step": 5470 }, { "epoch": 0.15, "learning_rate": 1.9261561746901166e-05, "loss": 1.5137, "step": 5471 }, { "epoch": 0.15, "learning_rate": 1.9261228127441004e-05, "loss": 1.2449, "step": 5472 }, { "epoch": 0.15, "learning_rate": 1.9260894435525352e-05, "loss": 1.407, "step": 5473 }, { "epoch": 0.15, "learning_rate": 1.9260560671156815e-05, "loss": 1.45, "step": 5474 }, { "epoch": 0.15, "learning_rate": 1.9260226834338007e-05, "loss": 1.4055, "step": 5475 }, { "epoch": 0.15, "learning_rate": 1.9259892925071536e-05, "loss": 1.3674, "step": 5476 }, { "epoch": 0.15, "learning_rate": 1.925955894336002e-05, "loss": 1.3411, "step": 5477 }, { "epoch": 0.15, "learning_rate": 1.925922488920607e-05, "loss": 1.4189, "step": 5478 }, { "epoch": 0.15, "learning_rate": 1.9258890762612296e-05, "loss": 1.4229, "step": 5479 }, { "epoch": 0.15, "learning_rate": 1.9258556563581315e-05, "loss": 1.2839, "step": 5480 }, { "epoch": 0.15, "learning_rate": 1.9258222292115742e-05, "loss": 1.5107, "step": 5481 }, { "epoch": 0.15, "learning_rate": 1.925788794821819e-05, "loss": 1.5522, "step": 5482 }, { "epoch": 0.15, "learning_rate": 1.9257553531891278e-05, "loss": 1.4612, "step": 5483 }, { "epoch": 0.15, "learning_rate": 1.9257219043137617e-05, "loss": 1.7344, "step": 5484 }, { "epoch": 0.15, "learning_rate": 1.925688448195983e-05, "loss": 1.2866, "step": 5485 }, { "epoch": 0.15, "learning_rate": 1.925654984836053e-05, "loss": 1.5176, "step": 5486 }, { "epoch": 0.15, "learning_rate": 1.925621514234234e-05, "loss": 1.3267, "step": 5487 }, { "epoch": 0.15, "learning_rate": 1.9255880363907873e-05, "loss": 1.1902, "step": 5488 }, { "epoch": 0.15, "learning_rate": 1.9255545513059754e-05, "loss": 1.4053, "step": 5489 }, { "epoch": 0.15, "learning_rate": 1.9255210589800594e-05, "loss": 1.4958, "step": 5490 }, { "epoch": 0.15, "learning_rate": 1.9254875594133022e-05, "loss": 1.425, "step": 5491 }, { "epoch": 0.15, "learning_rate": 1.9254540526059647e-05, "loss": 1.5437, "step": 5492 }, { "epoch": 0.15, "learning_rate": 1.925420538558311e-05, "loss": 1.2361, "step": 5493 }, { "epoch": 0.15, "learning_rate": 1.9253870172706017e-05, "loss": 1.7607, "step": 5494 }, { "epoch": 0.15, "learning_rate": 1.9253534887430992e-05, "loss": 1.4102, "step": 5495 }, { "epoch": 0.15, "learning_rate": 1.9253199529760668e-05, "loss": 1.3538, "step": 5496 }, { "epoch": 0.15, "learning_rate": 1.9252864099697656e-05, "loss": 1.2478, "step": 5497 }, { "epoch": 0.15, "learning_rate": 1.9252528597244587e-05, "loss": 1.4551, "step": 5498 }, { "epoch": 0.15, "learning_rate": 1.925219302240409e-05, "loss": 1.376, "step": 5499 }, { "epoch": 0.15, "learning_rate": 1.925185737517878e-05, "loss": 1.51, "step": 5500 }, { "epoch": 0.15, "learning_rate": 1.925152165557129e-05, "loss": 1.4897, "step": 5501 }, { "epoch": 0.15, "learning_rate": 1.9251185863584247e-05, "loss": 1.46, "step": 5502 }, { "epoch": 0.15, "learning_rate": 1.9250849999220275e-05, "loss": 1.4248, "step": 5503 }, { "epoch": 0.15, "learning_rate": 1.9250514062482005e-05, "loss": 1.3967, "step": 5504 }, { "epoch": 0.15, "learning_rate": 1.9250178053372058e-05, "loss": 1.3572, "step": 5505 }, { "epoch": 0.15, "learning_rate": 1.924984197189307e-05, "loss": 1.4656, "step": 5506 }, { "epoch": 0.15, "learning_rate": 1.9249505818047666e-05, "loss": 1.3997, "step": 5507 }, { "epoch": 0.15, "learning_rate": 1.9249169591838482e-05, "loss": 1.426, "step": 5508 }, { "epoch": 0.15, "learning_rate": 1.9248833293268144e-05, "loss": 1.4426, "step": 5509 }, { "epoch": 0.15, "learning_rate": 1.924849692233928e-05, "loss": 1.8003, "step": 5510 }, { "epoch": 0.15, "learning_rate": 1.9248160479054524e-05, "loss": 1.5176, "step": 5511 }, { "epoch": 0.15, "learning_rate": 1.9247823963416513e-05, "loss": 1.3113, "step": 5512 }, { "epoch": 0.15, "learning_rate": 1.9247487375427875e-05, "loss": 1.4932, "step": 5513 }, { "epoch": 0.15, "learning_rate": 1.9247150715091246e-05, "loss": 1.5234, "step": 5514 }, { "epoch": 0.15, "learning_rate": 1.9246813982409255e-05, "loss": 1.4097, "step": 5515 }, { "epoch": 0.15, "learning_rate": 1.9246477177384542e-05, "loss": 1.5728, "step": 5516 }, { "epoch": 0.15, "learning_rate": 1.924614030001974e-05, "loss": 1.4788, "step": 5517 }, { "epoch": 0.15, "learning_rate": 1.924580335031748e-05, "loss": 1.3804, "step": 5518 }, { "epoch": 0.15, "learning_rate": 1.9245466328280406e-05, "loss": 1.5479, "step": 5519 }, { "epoch": 0.15, "learning_rate": 1.924512923391115e-05, "loss": 1.4556, "step": 5520 }, { "epoch": 0.15, "learning_rate": 1.9244792067212346e-05, "loss": 1.4717, "step": 5521 }, { "epoch": 0.15, "learning_rate": 1.9244454828186643e-05, "loss": 1.3972, "step": 5522 }, { "epoch": 0.15, "learning_rate": 1.924411751683667e-05, "loss": 1.3398, "step": 5523 }, { "epoch": 0.15, "learning_rate": 1.9243780133165067e-05, "loss": 1.3936, "step": 5524 }, { "epoch": 0.15, "learning_rate": 1.9243442677174477e-05, "loss": 1.3906, "step": 5525 }, { "epoch": 0.15, "learning_rate": 1.9243105148867537e-05, "loss": 1.3774, "step": 5526 }, { "epoch": 0.15, "learning_rate": 1.9242767548246887e-05, "loss": 1.4055, "step": 5527 }, { "epoch": 0.15, "learning_rate": 1.924242987531517e-05, "loss": 1.5, "step": 5528 }, { "epoch": 0.15, "learning_rate": 1.9242092130075033e-05, "loss": 1.4031, "step": 5529 }, { "epoch": 0.15, "learning_rate": 1.924175431252911e-05, "loss": 1.4429, "step": 5530 }, { "epoch": 0.15, "learning_rate": 1.9241416422680044e-05, "loss": 1.3198, "step": 5531 }, { "epoch": 0.15, "learning_rate": 1.9241078460530486e-05, "loss": 1.532, "step": 5532 }, { "epoch": 0.15, "learning_rate": 1.9240740426083075e-05, "loss": 1.3684, "step": 5533 }, { "epoch": 0.15, "learning_rate": 1.9240402319340452e-05, "loss": 1.429, "step": 5534 }, { "epoch": 0.15, "learning_rate": 1.924006414030527e-05, "loss": 1.4829, "step": 5535 }, { "epoch": 0.15, "learning_rate": 1.923972588898017e-05, "loss": 1.26, "step": 5536 }, { "epoch": 0.15, "learning_rate": 1.92393875653678e-05, "loss": 1.438, "step": 5537 }, { "epoch": 0.15, "learning_rate": 1.9239049169470805e-05, "loss": 1.4104, "step": 5538 }, { "epoch": 0.15, "learning_rate": 1.9238710701291835e-05, "loss": 1.4658, "step": 5539 }, { "epoch": 0.15, "learning_rate": 1.9238372160833537e-05, "loss": 1.3079, "step": 5540 }, { "epoch": 0.15, "learning_rate": 1.923803354809856e-05, "loss": 1.3003, "step": 5541 }, { "epoch": 0.15, "learning_rate": 1.9237694863089552e-05, "loss": 1.3103, "step": 5542 }, { "epoch": 0.15, "learning_rate": 1.9237356105809163e-05, "loss": 1.4531, "step": 5543 }, { "epoch": 0.15, "learning_rate": 1.9237017276260045e-05, "loss": 1.4146, "step": 5544 }, { "epoch": 0.15, "learning_rate": 1.9236678374444844e-05, "loss": 1.4185, "step": 5545 }, { "epoch": 0.15, "learning_rate": 1.9236339400366217e-05, "loss": 1.4976, "step": 5546 }, { "epoch": 0.15, "learning_rate": 1.9236000354026812e-05, "loss": 1.4092, "step": 5547 }, { "epoch": 0.15, "learning_rate": 1.9235661235429287e-05, "loss": 1.5327, "step": 5548 }, { "epoch": 0.15, "learning_rate": 1.923532204457629e-05, "loss": 1.4453, "step": 5549 }, { "epoch": 0.15, "learning_rate": 1.9234982781470475e-05, "loss": 1.583, "step": 5550 }, { "epoch": 0.15, "learning_rate": 1.9234643446114498e-05, "loss": 1.364, "step": 5551 }, { "epoch": 0.15, "learning_rate": 1.9234304038511014e-05, "loss": 1.2317, "step": 5552 }, { "epoch": 0.15, "learning_rate": 1.9233964558662675e-05, "loss": 1.4761, "step": 5553 }, { "epoch": 0.15, "learning_rate": 1.9233625006572142e-05, "loss": 1.3364, "step": 5554 }, { "epoch": 0.15, "learning_rate": 1.9233285382242062e-05, "loss": 1.5024, "step": 5555 }, { "epoch": 0.15, "learning_rate": 1.923294568567511e-05, "loss": 1.4629, "step": 5556 }, { "epoch": 0.15, "learning_rate": 1.9232605916873924e-05, "loss": 1.4087, "step": 5557 }, { "epoch": 0.15, "learning_rate": 1.9232266075841174e-05, "loss": 1.4756, "step": 5558 }, { "epoch": 0.15, "learning_rate": 1.9231926162579517e-05, "loss": 1.4424, "step": 5559 }, { "epoch": 0.15, "learning_rate": 1.9231586177091607e-05, "loss": 1.7988, "step": 5560 }, { "epoch": 0.15, "learning_rate": 1.923124611938011e-05, "loss": 1.4316, "step": 5561 }, { "epoch": 0.15, "learning_rate": 1.9230905989447686e-05, "loss": 1.3459, "step": 5562 }, { "epoch": 0.15, "learning_rate": 1.923056578729699e-05, "loss": 1.3718, "step": 5563 }, { "epoch": 0.15, "learning_rate": 1.923022551293069e-05, "loss": 1.3882, "step": 5564 }, { "epoch": 0.15, "learning_rate": 1.9229885166351446e-05, "loss": 1.3154, "step": 5565 }, { "epoch": 0.15, "learning_rate": 1.9229544747561924e-05, "loss": 1.5557, "step": 5566 }, { "epoch": 0.15, "learning_rate": 1.9229204256564782e-05, "loss": 1.439, "step": 5567 }, { "epoch": 0.15, "learning_rate": 1.9228863693362682e-05, "loss": 1.3152, "step": 5568 }, { "epoch": 0.15, "learning_rate": 1.9228523057958294e-05, "loss": 1.5684, "step": 5569 }, { "epoch": 0.15, "learning_rate": 1.922818235035428e-05, "loss": 1.438, "step": 5570 }, { "epoch": 0.15, "learning_rate": 1.922784157055331e-05, "loss": 1.3818, "step": 5571 }, { "epoch": 0.15, "learning_rate": 1.9227500718558048e-05, "loss": 1.5413, "step": 5572 }, { "epoch": 0.15, "learning_rate": 1.9227159794371156e-05, "loss": 1.3623, "step": 5573 }, { "epoch": 0.15, "learning_rate": 1.9226818797995306e-05, "loss": 1.5088, "step": 5574 }, { "epoch": 0.15, "learning_rate": 1.9226477729433163e-05, "loss": 1.3708, "step": 5575 }, { "epoch": 0.15, "learning_rate": 1.9226136588687398e-05, "loss": 1.262, "step": 5576 }, { "epoch": 0.15, "learning_rate": 1.922579537576068e-05, "loss": 1.3604, "step": 5577 }, { "epoch": 0.15, "learning_rate": 1.9225454090655675e-05, "loss": 1.3535, "step": 5578 }, { "epoch": 0.15, "learning_rate": 1.9225112733375057e-05, "loss": 1.3665, "step": 5579 }, { "epoch": 0.15, "learning_rate": 1.9224771303921493e-05, "loss": 1.4504, "step": 5580 }, { "epoch": 0.15, "learning_rate": 1.922442980229766e-05, "loss": 1.3281, "step": 5581 }, { "epoch": 0.15, "learning_rate": 1.9224088228506218e-05, "loss": 1.606, "step": 5582 }, { "epoch": 0.15, "learning_rate": 1.9223746582549853e-05, "loss": 1.3911, "step": 5583 }, { "epoch": 0.15, "learning_rate": 1.9223404864431235e-05, "loss": 1.4578, "step": 5584 }, { "epoch": 0.15, "learning_rate": 1.922306307415303e-05, "loss": 1.5186, "step": 5585 }, { "epoch": 0.15, "learning_rate": 1.9222721211717914e-05, "loss": 1.5637, "step": 5586 }, { "epoch": 0.15, "learning_rate": 1.922237927712857e-05, "loss": 1.5264, "step": 5587 }, { "epoch": 0.15, "learning_rate": 1.9222037270387663e-05, "loss": 1.3936, "step": 5588 }, { "epoch": 0.15, "learning_rate": 1.9221695191497875e-05, "loss": 1.5671, "step": 5589 }, { "epoch": 0.15, "learning_rate": 1.922135304046188e-05, "loss": 1.417, "step": 5590 }, { "epoch": 0.15, "learning_rate": 1.9221010817282353e-05, "loss": 1.4563, "step": 5591 }, { "epoch": 0.15, "learning_rate": 1.9220668521961976e-05, "loss": 1.3225, "step": 5592 }, { "epoch": 0.15, "learning_rate": 1.9220326154503425e-05, "loss": 1.4419, "step": 5593 }, { "epoch": 0.15, "learning_rate": 1.9219983714909376e-05, "loss": 1.2737, "step": 5594 }, { "epoch": 0.15, "learning_rate": 1.921964120318251e-05, "loss": 1.4561, "step": 5595 }, { "epoch": 0.15, "learning_rate": 1.9219298619325506e-05, "loss": 1.3604, "step": 5596 }, { "epoch": 0.15, "learning_rate": 1.9218955963341047e-05, "loss": 1.2629, "step": 5597 }, { "epoch": 0.15, "learning_rate": 1.9218613235231808e-05, "loss": 1.4819, "step": 5598 }, { "epoch": 0.15, "learning_rate": 1.9218270435000475e-05, "loss": 1.2305, "step": 5599 }, { "epoch": 0.15, "learning_rate": 1.921792756264973e-05, "loss": 1.3933, "step": 5600 }, { "epoch": 0.15, "learning_rate": 1.9217584618182256e-05, "loss": 1.4536, "step": 5601 }, { "epoch": 0.15, "learning_rate": 1.921724160160073e-05, "loss": 1.4592, "step": 5602 }, { "epoch": 0.15, "learning_rate": 1.9216898512907845e-05, "loss": 1.4907, "step": 5603 }, { "epoch": 0.15, "learning_rate": 1.921655535210628e-05, "loss": 1.4058, "step": 5604 }, { "epoch": 0.15, "learning_rate": 1.9216212119198715e-05, "loss": 1.4565, "step": 5605 }, { "epoch": 0.15, "learning_rate": 1.9215868814187845e-05, "loss": 1.5073, "step": 5606 }, { "epoch": 0.15, "learning_rate": 1.9215525437076347e-05, "loss": 1.5459, "step": 5607 }, { "epoch": 0.15, "learning_rate": 1.9215181987866913e-05, "loss": 1.5562, "step": 5608 }, { "epoch": 0.15, "learning_rate": 1.921483846656223e-05, "loss": 1.4346, "step": 5609 }, { "epoch": 0.15, "learning_rate": 1.9214494873164978e-05, "loss": 1.3494, "step": 5610 }, { "epoch": 0.15, "learning_rate": 1.9214151207677858e-05, "loss": 1.5645, "step": 5611 }, { "epoch": 0.15, "learning_rate": 1.921380747010355e-05, "loss": 1.5911, "step": 5612 }, { "epoch": 0.15, "learning_rate": 1.9213463660444745e-05, "loss": 1.344, "step": 5613 }, { "epoch": 0.15, "learning_rate": 1.921311977870413e-05, "loss": 1.522, "step": 5614 }, { "epoch": 0.15, "learning_rate": 1.9212775824884403e-05, "loss": 1.4331, "step": 5615 }, { "epoch": 0.15, "learning_rate": 1.9212431798988243e-05, "loss": 1.6191, "step": 5616 }, { "epoch": 0.15, "learning_rate": 1.9212087701018355e-05, "loss": 1.5007, "step": 5617 }, { "epoch": 0.15, "learning_rate": 1.9211743530977425e-05, "loss": 1.5444, "step": 5618 }, { "epoch": 0.15, "learning_rate": 1.9211399288868143e-05, "loss": 1.3203, "step": 5619 }, { "epoch": 0.15, "learning_rate": 1.9211054974693203e-05, "loss": 1.3484, "step": 5620 }, { "epoch": 0.15, "learning_rate": 1.9210710588455303e-05, "loss": 1.6208, "step": 5621 }, { "epoch": 0.15, "learning_rate": 1.921036613015713e-05, "loss": 1.3369, "step": 5622 }, { "epoch": 0.15, "learning_rate": 1.921002159980139e-05, "loss": 1.2654, "step": 5623 }, { "epoch": 0.15, "learning_rate": 1.9209676997390766e-05, "loss": 1.5337, "step": 5624 }, { "epoch": 0.15, "learning_rate": 1.9209332322927964e-05, "loss": 1.2324, "step": 5625 }, { "epoch": 0.15, "learning_rate": 1.9208987576415675e-05, "loss": 1.3586, "step": 5626 }, { "epoch": 0.15, "learning_rate": 1.9208642757856596e-05, "loss": 1.4937, "step": 5627 }, { "epoch": 0.15, "learning_rate": 1.920829786725343e-05, "loss": 1.2786, "step": 5628 }, { "epoch": 0.15, "learning_rate": 1.9207952904608865e-05, "loss": 1.4578, "step": 5629 }, { "epoch": 0.15, "learning_rate": 1.9207607869925613e-05, "loss": 1.387, "step": 5630 }, { "epoch": 0.15, "learning_rate": 1.9207262763206363e-05, "loss": 1.1946, "step": 5631 }, { "epoch": 0.15, "learning_rate": 1.920691758445382e-05, "loss": 1.3228, "step": 5632 }, { "epoch": 0.15, "learning_rate": 1.9206572333670683e-05, "loss": 1.3342, "step": 5633 }, { "epoch": 0.15, "learning_rate": 1.9206227010859653e-05, "loss": 1.4026, "step": 5634 }, { "epoch": 0.15, "learning_rate": 1.9205881616023434e-05, "loss": 1.374, "step": 5635 }, { "epoch": 0.15, "learning_rate": 1.9205536149164724e-05, "loss": 1.3835, "step": 5636 }, { "epoch": 0.15, "learning_rate": 1.920519061028623e-05, "loss": 1.3132, "step": 5637 }, { "epoch": 0.15, "learning_rate": 1.920484499939065e-05, "loss": 1.4802, "step": 5638 }, { "epoch": 0.15, "learning_rate": 1.9204499316480694e-05, "loss": 1.3057, "step": 5639 }, { "epoch": 0.15, "learning_rate": 1.920415356155906e-05, "loss": 1.3467, "step": 5640 }, { "epoch": 0.15, "learning_rate": 1.920380773462846e-05, "loss": 1.4023, "step": 5641 }, { "epoch": 0.15, "learning_rate": 1.9203461835691596e-05, "loss": 1.313, "step": 5642 }, { "epoch": 0.15, "learning_rate": 1.9203115864751172e-05, "loss": 1.438, "step": 5643 }, { "epoch": 0.15, "learning_rate": 1.92027698218099e-05, "loss": 1.4277, "step": 5644 }, { "epoch": 0.15, "learning_rate": 1.9202423706870483e-05, "loss": 1.3503, "step": 5645 }, { "epoch": 0.15, "learning_rate": 1.920207751993563e-05, "loss": 1.2217, "step": 5646 }, { "epoch": 0.15, "learning_rate": 1.920173126100805e-05, "loss": 1.5752, "step": 5647 }, { "epoch": 0.15, "learning_rate": 1.9201384930090452e-05, "loss": 1.457, "step": 5648 }, { "epoch": 0.15, "learning_rate": 1.9201038527185546e-05, "loss": 1.3464, "step": 5649 }, { "epoch": 0.15, "learning_rate": 1.920069205229604e-05, "loss": 1.5942, "step": 5650 }, { "epoch": 0.15, "learning_rate": 1.9200345505424644e-05, "loss": 1.186, "step": 5651 }, { "epoch": 0.15, "learning_rate": 1.9199998886574072e-05, "loss": 1.3591, "step": 5652 }, { "epoch": 0.15, "learning_rate": 1.9199652195747038e-05, "loss": 1.3704, "step": 5653 }, { "epoch": 0.15, "learning_rate": 1.919930543294625e-05, "loss": 1.4048, "step": 5654 }, { "epoch": 0.15, "learning_rate": 1.919895859817442e-05, "loss": 1.3232, "step": 5655 }, { "epoch": 0.15, "learning_rate": 1.919861169143426e-05, "loss": 1.3921, "step": 5656 }, { "epoch": 0.15, "learning_rate": 1.9198264712728494e-05, "loss": 1.2717, "step": 5657 }, { "epoch": 0.15, "learning_rate": 1.9197917662059828e-05, "loss": 1.5078, "step": 5658 }, { "epoch": 0.15, "learning_rate": 1.919757053943098e-05, "loss": 1.501, "step": 5659 }, { "epoch": 0.15, "learning_rate": 1.9197223344844666e-05, "loss": 1.2986, "step": 5660 }, { "epoch": 0.15, "learning_rate": 1.9196876078303602e-05, "loss": 1.2793, "step": 5661 }, { "epoch": 0.15, "learning_rate": 1.91965287398105e-05, "loss": 1.4233, "step": 5662 }, { "epoch": 0.15, "learning_rate": 1.9196181329368083e-05, "loss": 1.5381, "step": 5663 }, { "epoch": 0.15, "learning_rate": 1.919583384697907e-05, "loss": 1.813, "step": 5664 }, { "epoch": 0.15, "learning_rate": 1.9195486292646178e-05, "loss": 1.5386, "step": 5665 }, { "epoch": 0.15, "learning_rate": 1.919513866637212e-05, "loss": 1.478, "step": 5666 }, { "epoch": 0.15, "learning_rate": 1.9194790968159625e-05, "loss": 1.2061, "step": 5667 }, { "epoch": 0.15, "learning_rate": 1.919444319801141e-05, "loss": 1.5322, "step": 5668 }, { "epoch": 0.15, "learning_rate": 1.9194095355930193e-05, "loss": 1.4355, "step": 5669 }, { "epoch": 0.15, "learning_rate": 1.9193747441918696e-05, "loss": 1.4517, "step": 5670 }, { "epoch": 0.15, "learning_rate": 1.9193399455979644e-05, "loss": 1.4673, "step": 5671 }, { "epoch": 0.15, "learning_rate": 1.9193051398115755e-05, "loss": 1.4155, "step": 5672 }, { "epoch": 0.15, "learning_rate": 1.919270326832976e-05, "loss": 1.3538, "step": 5673 }, { "epoch": 0.15, "learning_rate": 1.9192355066624372e-05, "loss": 1.3538, "step": 5674 }, { "epoch": 0.15, "learning_rate": 1.9192006793002323e-05, "loss": 1.499, "step": 5675 }, { "epoch": 0.16, "learning_rate": 1.9191658447466337e-05, "loss": 1.4954, "step": 5676 }, { "epoch": 0.16, "learning_rate": 1.9191310030019137e-05, "loss": 1.3677, "step": 5677 }, { "epoch": 0.16, "learning_rate": 1.9190961540663447e-05, "loss": 1.4844, "step": 5678 }, { "epoch": 0.16, "learning_rate": 1.9190612979401996e-05, "loss": 1.3538, "step": 5679 }, { "epoch": 0.16, "learning_rate": 1.919026434623751e-05, "loss": 1.6372, "step": 5680 }, { "epoch": 0.16, "learning_rate": 1.918991564117272e-05, "loss": 1.3955, "step": 5681 }, { "epoch": 0.16, "learning_rate": 1.9189566864210352e-05, "loss": 1.5156, "step": 5682 }, { "epoch": 0.16, "learning_rate": 1.918921801535313e-05, "loss": 1.3528, "step": 5683 }, { "epoch": 0.16, "learning_rate": 1.9188869094603792e-05, "loss": 1.3735, "step": 5684 }, { "epoch": 0.16, "learning_rate": 1.9188520101965063e-05, "loss": 1.4788, "step": 5685 }, { "epoch": 0.16, "learning_rate": 1.918817103743967e-05, "loss": 1.4375, "step": 5686 }, { "epoch": 0.16, "learning_rate": 1.918782190103035e-05, "loss": 1.4873, "step": 5687 }, { "epoch": 0.16, "learning_rate": 1.9187472692739827e-05, "loss": 1.4478, "step": 5688 }, { "epoch": 0.16, "learning_rate": 1.9187123412570844e-05, "loss": 1.2842, "step": 5689 }, { "epoch": 0.16, "learning_rate": 1.9186774060526125e-05, "loss": 1.4443, "step": 5690 }, { "epoch": 0.16, "learning_rate": 1.9186424636608407e-05, "loss": 1.1128, "step": 5691 }, { "epoch": 0.16, "learning_rate": 1.918607514082042e-05, "loss": 1.4431, "step": 5692 }, { "epoch": 0.16, "learning_rate": 1.91857255731649e-05, "loss": 1.5156, "step": 5693 }, { "epoch": 0.16, "learning_rate": 1.9185375933644586e-05, "loss": 1.4561, "step": 5694 }, { "epoch": 0.16, "learning_rate": 1.9185026222262206e-05, "loss": 1.4766, "step": 5695 }, { "epoch": 0.16, "learning_rate": 1.9184676439020504e-05, "loss": 1.3679, "step": 5696 }, { "epoch": 0.16, "learning_rate": 1.918432658392221e-05, "loss": 1.3892, "step": 5697 }, { "epoch": 0.16, "learning_rate": 1.9183976656970066e-05, "loss": 1.3804, "step": 5698 }, { "epoch": 0.16, "learning_rate": 1.9183626658166804e-05, "loss": 1.4731, "step": 5699 }, { "epoch": 0.16, "learning_rate": 1.918327658751517e-05, "loss": 1.3794, "step": 5700 }, { "epoch": 0.16, "learning_rate": 1.9182926445017893e-05, "loss": 1.3091, "step": 5701 }, { "epoch": 0.16, "learning_rate": 1.918257623067772e-05, "loss": 1.4888, "step": 5702 }, { "epoch": 0.16, "learning_rate": 1.918222594449739e-05, "loss": 1.5396, "step": 5703 }, { "epoch": 0.16, "learning_rate": 1.9181875586479638e-05, "loss": 1.3843, "step": 5704 }, { "epoch": 0.16, "learning_rate": 1.918152515662721e-05, "loss": 1.4121, "step": 5705 }, { "epoch": 0.16, "learning_rate": 1.918117465494285e-05, "loss": 1.3458, "step": 5706 }, { "epoch": 0.16, "learning_rate": 1.9180824081429296e-05, "loss": 1.3127, "step": 5707 }, { "epoch": 0.16, "learning_rate": 1.9180473436089292e-05, "loss": 1.4639, "step": 5708 }, { "epoch": 0.16, "learning_rate": 1.9180122718925577e-05, "loss": 1.385, "step": 5709 }, { "epoch": 0.16, "learning_rate": 1.91797719299409e-05, "loss": 1.52, "step": 5710 }, { "epoch": 0.16, "learning_rate": 1.9179421069138006e-05, "loss": 1.3447, "step": 5711 }, { "epoch": 0.16, "learning_rate": 1.9179070136519636e-05, "loss": 1.5315, "step": 5712 }, { "epoch": 0.16, "learning_rate": 1.917871913208854e-05, "loss": 1.4502, "step": 5713 }, { "epoch": 0.16, "learning_rate": 1.917836805584746e-05, "loss": 1.2715, "step": 5714 }, { "epoch": 0.16, "learning_rate": 1.9178016907799147e-05, "loss": 1.3174, "step": 5715 }, { "epoch": 0.16, "learning_rate": 1.917766568794634e-05, "loss": 1.4607, "step": 5716 }, { "epoch": 0.16, "learning_rate": 1.9177314396291796e-05, "loss": 1.5254, "step": 5717 }, { "epoch": 0.16, "learning_rate": 1.917696303283826e-05, "loss": 1.3208, "step": 5718 }, { "epoch": 0.16, "learning_rate": 1.917661159758848e-05, "loss": 1.2676, "step": 5719 }, { "epoch": 0.16, "learning_rate": 1.91762600905452e-05, "loss": 1.395, "step": 5720 }, { "epoch": 0.16, "learning_rate": 1.9175908511711186e-05, "loss": 1.2134, "step": 5721 }, { "epoch": 0.16, "learning_rate": 1.9175556861089174e-05, "loss": 1.2925, "step": 5722 }, { "epoch": 0.16, "learning_rate": 1.917520513868192e-05, "loss": 1.4248, "step": 5723 }, { "epoch": 0.16, "learning_rate": 1.9174853344492175e-05, "loss": 1.5298, "step": 5724 }, { "epoch": 0.16, "learning_rate": 1.9174501478522692e-05, "loss": 1.4539, "step": 5725 }, { "epoch": 0.16, "learning_rate": 1.9174149540776222e-05, "loss": 1.4841, "step": 5726 }, { "epoch": 0.16, "learning_rate": 1.917379753125552e-05, "loss": 1.3901, "step": 5727 }, { "epoch": 0.16, "learning_rate": 1.9173445449963344e-05, "loss": 1.4424, "step": 5728 }, { "epoch": 0.16, "learning_rate": 1.9173093296902445e-05, "loss": 1.2942, "step": 5729 }, { "epoch": 0.16, "learning_rate": 1.917274107207557e-05, "loss": 1.3777, "step": 5730 }, { "epoch": 0.16, "learning_rate": 1.9172388775485487e-05, "loss": 1.3975, "step": 5731 }, { "epoch": 0.16, "learning_rate": 1.9172036407134952e-05, "loss": 1.8315, "step": 5732 }, { "epoch": 0.16, "learning_rate": 1.917168396702671e-05, "loss": 1.5342, "step": 5733 }, { "epoch": 0.16, "learning_rate": 1.9171331455163527e-05, "loss": 1.4731, "step": 5734 }, { "epoch": 0.16, "learning_rate": 1.917097887154816e-05, "loss": 1.2898, "step": 5735 }, { "epoch": 0.16, "learning_rate": 1.9170626216183368e-05, "loss": 1.3718, "step": 5736 }, { "epoch": 0.16, "learning_rate": 1.917027348907191e-05, "loss": 1.2783, "step": 5737 }, { "epoch": 0.16, "learning_rate": 1.916992069021654e-05, "loss": 1.5161, "step": 5738 }, { "epoch": 0.16, "learning_rate": 1.9169567819620024e-05, "loss": 1.4873, "step": 5739 }, { "epoch": 0.16, "learning_rate": 1.9169214877285123e-05, "loss": 1.386, "step": 5740 }, { "epoch": 0.16, "learning_rate": 1.9168861863214596e-05, "loss": 1.5288, "step": 5741 }, { "epoch": 0.16, "learning_rate": 1.9168508777411203e-05, "loss": 1.4448, "step": 5742 }, { "epoch": 0.16, "learning_rate": 1.9168155619877712e-05, "loss": 1.4175, "step": 5743 }, { "epoch": 0.16, "learning_rate": 1.9167802390616882e-05, "loss": 1.5642, "step": 5744 }, { "epoch": 0.16, "learning_rate": 1.9167449089631474e-05, "loss": 1.4351, "step": 5745 }, { "epoch": 0.16, "learning_rate": 1.9167095716924256e-05, "loss": 1.6724, "step": 5746 }, { "epoch": 0.16, "learning_rate": 1.9166742272497996e-05, "loss": 1.3665, "step": 5747 }, { "epoch": 0.16, "learning_rate": 1.916638875635545e-05, "loss": 1.4363, "step": 5748 }, { "epoch": 0.16, "learning_rate": 1.916603516849939e-05, "loss": 1.5459, "step": 5749 }, { "epoch": 0.16, "learning_rate": 1.9165681508932584e-05, "loss": 1.2791, "step": 5750 }, { "epoch": 0.16, "learning_rate": 1.9165327777657793e-05, "loss": 1.2231, "step": 5751 }, { "epoch": 0.16, "learning_rate": 1.9164973974677787e-05, "loss": 1.4429, "step": 5752 }, { "epoch": 0.16, "learning_rate": 1.9164620099995334e-05, "loss": 1.4805, "step": 5753 }, { "epoch": 0.16, "learning_rate": 1.9164266153613205e-05, "loss": 1.5083, "step": 5754 }, { "epoch": 0.16, "learning_rate": 1.9163912135534166e-05, "loss": 1.4619, "step": 5755 }, { "epoch": 0.16, "learning_rate": 1.9163558045760985e-05, "loss": 1.4729, "step": 5756 }, { "epoch": 0.16, "learning_rate": 1.916320388429644e-05, "loss": 1.4888, "step": 5757 }, { "epoch": 0.16, "learning_rate": 1.9162849651143293e-05, "loss": 1.4258, "step": 5758 }, { "epoch": 0.16, "learning_rate": 1.9162495346304323e-05, "loss": 1.4604, "step": 5759 }, { "epoch": 0.16, "learning_rate": 1.9162140969782292e-05, "loss": 1.5708, "step": 5760 }, { "epoch": 0.16, "learning_rate": 1.9161786521579984e-05, "loss": 1.3826, "step": 5761 }, { "epoch": 0.16, "learning_rate": 1.916143200170016e-05, "loss": 1.4875, "step": 5762 }, { "epoch": 0.16, "learning_rate": 1.9161077410145607e-05, "loss": 1.3037, "step": 5763 }, { "epoch": 0.16, "learning_rate": 1.916072274691909e-05, "loss": 1.4114, "step": 5764 }, { "epoch": 0.16, "learning_rate": 1.916036801202338e-05, "loss": 1.4478, "step": 5765 }, { "epoch": 0.16, "learning_rate": 1.9160013205461267e-05, "loss": 1.3955, "step": 5766 }, { "epoch": 0.16, "learning_rate": 1.9159658327235513e-05, "loss": 1.3032, "step": 5767 }, { "epoch": 0.16, "learning_rate": 1.9159303377348902e-05, "loss": 1.4146, "step": 5768 }, { "epoch": 0.16, "learning_rate": 1.9158948355804204e-05, "loss": 1.3733, "step": 5769 }, { "epoch": 0.16, "learning_rate": 1.9158593262604206e-05, "loss": 1.3008, "step": 5770 }, { "epoch": 0.16, "learning_rate": 1.9158238097751678e-05, "loss": 1.4917, "step": 5771 }, { "epoch": 0.16, "learning_rate": 1.9157882861249405e-05, "loss": 1.4214, "step": 5772 }, { "epoch": 0.16, "learning_rate": 1.915752755310016e-05, "loss": 1.4648, "step": 5773 }, { "epoch": 0.16, "learning_rate": 1.9157172173306722e-05, "loss": 1.416, "step": 5774 }, { "epoch": 0.16, "learning_rate": 1.915681672187188e-05, "loss": 1.6147, "step": 5775 }, { "epoch": 0.16, "learning_rate": 1.915646119879841e-05, "loss": 1.4358, "step": 5776 }, { "epoch": 0.16, "learning_rate": 1.9156105604089093e-05, "loss": 1.3672, "step": 5777 }, { "epoch": 0.16, "learning_rate": 1.9155749937746707e-05, "loss": 1.2812, "step": 5778 }, { "epoch": 0.16, "learning_rate": 1.9155394199774045e-05, "loss": 1.3313, "step": 5779 }, { "epoch": 0.16, "learning_rate": 1.9155038390173878e-05, "loss": 1.3333, "step": 5780 }, { "epoch": 0.16, "learning_rate": 1.9154682508948998e-05, "loss": 1.3638, "step": 5781 }, { "epoch": 0.16, "learning_rate": 1.915432655610219e-05, "loss": 1.4771, "step": 5782 }, { "epoch": 0.16, "learning_rate": 1.9153970531636233e-05, "loss": 1.5576, "step": 5783 }, { "epoch": 0.16, "learning_rate": 1.9153614435553917e-05, "loss": 1.4912, "step": 5784 }, { "epoch": 0.16, "learning_rate": 1.9153258267858022e-05, "loss": 1.3804, "step": 5785 }, { "epoch": 0.16, "learning_rate": 1.915290202855134e-05, "loss": 1.4409, "step": 5786 }, { "epoch": 0.16, "learning_rate": 1.9152545717636657e-05, "loss": 1.3564, "step": 5787 }, { "epoch": 0.16, "learning_rate": 1.915218933511676e-05, "loss": 1.3176, "step": 5788 }, { "epoch": 0.16, "learning_rate": 1.9151832880994438e-05, "loss": 1.4258, "step": 5789 }, { "epoch": 0.16, "learning_rate": 1.915147635527248e-05, "loss": 1.46, "step": 5790 }, { "epoch": 0.16, "learning_rate": 1.9151119757953673e-05, "loss": 1.21, "step": 5791 }, { "epoch": 0.16, "learning_rate": 1.9150763089040807e-05, "loss": 1.3923, "step": 5792 }, { "epoch": 0.16, "learning_rate": 1.9150406348536675e-05, "loss": 1.4099, "step": 5793 }, { "epoch": 0.16, "learning_rate": 1.9150049536444067e-05, "loss": 1.4399, "step": 5794 }, { "epoch": 0.16, "learning_rate": 1.9149692652765774e-05, "loss": 1.2839, "step": 5795 }, { "epoch": 0.16, "learning_rate": 1.9149335697504587e-05, "loss": 1.4709, "step": 5796 }, { "epoch": 0.16, "learning_rate": 1.91489786706633e-05, "loss": 1.3174, "step": 5797 }, { "epoch": 0.16, "learning_rate": 1.9148621572244704e-05, "loss": 1.4592, "step": 5798 }, { "epoch": 0.16, "learning_rate": 1.91482644022516e-05, "loss": 1.4226, "step": 5799 }, { "epoch": 0.16, "learning_rate": 1.9147907160686774e-05, "loss": 1.5271, "step": 5800 }, { "epoch": 0.16, "learning_rate": 1.9147549847553025e-05, "loss": 1.3435, "step": 5801 }, { "epoch": 0.16, "learning_rate": 1.9147192462853145e-05, "loss": 1.2888, "step": 5802 }, { "epoch": 0.16, "learning_rate": 1.9146835006589933e-05, "loss": 1.3799, "step": 5803 }, { "epoch": 0.16, "learning_rate": 1.9146477478766187e-05, "loss": 1.5083, "step": 5804 }, { "epoch": 0.16, "learning_rate": 1.91461198793847e-05, "loss": 1.5332, "step": 5805 }, { "epoch": 0.16, "learning_rate": 1.9145762208448278e-05, "loss": 1.3464, "step": 5806 }, { "epoch": 0.16, "learning_rate": 1.9145404465959708e-05, "loss": 1.4307, "step": 5807 }, { "epoch": 0.16, "learning_rate": 1.9145046651921794e-05, "loss": 1.4321, "step": 5808 }, { "epoch": 0.16, "learning_rate": 1.9144688766337335e-05, "loss": 1.384, "step": 5809 }, { "epoch": 0.16, "learning_rate": 1.914433080920913e-05, "loss": 1.3157, "step": 5810 }, { "epoch": 0.16, "learning_rate": 1.9143972780539982e-05, "loss": 1.2263, "step": 5811 }, { "epoch": 0.16, "learning_rate": 1.9143614680332695e-05, "loss": 1.3113, "step": 5812 }, { "epoch": 0.16, "learning_rate": 1.9143256508590064e-05, "loss": 1.4961, "step": 5813 }, { "epoch": 0.16, "learning_rate": 1.9142898265314887e-05, "loss": 1.4502, "step": 5814 }, { "epoch": 0.16, "learning_rate": 1.914253995050998e-05, "loss": 1.353, "step": 5815 }, { "epoch": 0.16, "learning_rate": 1.914218156417814e-05, "loss": 1.283, "step": 5816 }, { "epoch": 0.16, "learning_rate": 1.9141823106322167e-05, "loss": 1.415, "step": 5817 }, { "epoch": 0.16, "learning_rate": 1.9141464576944872e-05, "loss": 1.4082, "step": 5818 }, { "epoch": 0.16, "learning_rate": 1.9141105976049054e-05, "loss": 1.2898, "step": 5819 }, { "epoch": 0.16, "learning_rate": 1.9140747303637523e-05, "loss": 1.3894, "step": 5820 }, { "epoch": 0.16, "learning_rate": 1.9140388559713084e-05, "loss": 1.4468, "step": 5821 }, { "epoch": 0.16, "learning_rate": 1.9140029744278543e-05, "loss": 1.2505, "step": 5822 }, { "epoch": 0.16, "learning_rate": 1.9139670857336704e-05, "loss": 1.4285, "step": 5823 }, { "epoch": 0.16, "learning_rate": 1.913931189889038e-05, "loss": 1.3906, "step": 5824 }, { "epoch": 0.16, "learning_rate": 1.913895286894238e-05, "loss": 1.3682, "step": 5825 }, { "epoch": 0.16, "learning_rate": 1.9138593767495504e-05, "loss": 1.4092, "step": 5826 }, { "epoch": 0.16, "learning_rate": 1.9138234594552574e-05, "loss": 1.2559, "step": 5827 }, { "epoch": 0.16, "learning_rate": 1.913787535011639e-05, "loss": 1.7524, "step": 5828 }, { "epoch": 0.16, "learning_rate": 1.9137516034189768e-05, "loss": 1.3691, "step": 5829 }, { "epoch": 0.16, "learning_rate": 1.9137156646775514e-05, "loss": 1.4189, "step": 5830 }, { "epoch": 0.16, "learning_rate": 1.9136797187876446e-05, "loss": 1.3821, "step": 5831 }, { "epoch": 0.16, "learning_rate": 1.9136437657495373e-05, "loss": 1.3374, "step": 5832 }, { "epoch": 0.16, "learning_rate": 1.9136078055635107e-05, "loss": 1.3774, "step": 5833 }, { "epoch": 0.16, "learning_rate": 1.9135718382298464e-05, "loss": 1.5166, "step": 5834 }, { "epoch": 0.16, "learning_rate": 1.9135358637488256e-05, "loss": 1.4221, "step": 5835 }, { "epoch": 0.16, "learning_rate": 1.9134998821207296e-05, "loss": 1.4641, "step": 5836 }, { "epoch": 0.16, "learning_rate": 1.9134638933458404e-05, "loss": 1.3606, "step": 5837 }, { "epoch": 0.16, "learning_rate": 1.9134278974244388e-05, "loss": 1.4175, "step": 5838 }, { "epoch": 0.16, "learning_rate": 1.913391894356807e-05, "loss": 1.2937, "step": 5839 }, { "epoch": 0.16, "learning_rate": 1.9133558841432265e-05, "loss": 1.4006, "step": 5840 }, { "epoch": 0.16, "learning_rate": 1.9133198667839793e-05, "loss": 1.6704, "step": 5841 }, { "epoch": 0.16, "learning_rate": 1.9132838422793468e-05, "loss": 1.2051, "step": 5842 }, { "epoch": 0.16, "learning_rate": 1.913247810629611e-05, "loss": 1.4941, "step": 5843 }, { "epoch": 0.16, "learning_rate": 1.9132117718350536e-05, "loss": 1.3223, "step": 5844 }, { "epoch": 0.16, "learning_rate": 1.913175725895957e-05, "loss": 1.2939, "step": 5845 }, { "epoch": 0.16, "learning_rate": 1.913139672812603e-05, "loss": 1.3979, "step": 5846 }, { "epoch": 0.16, "learning_rate": 1.913103612585273e-05, "loss": 1.2686, "step": 5847 }, { "epoch": 0.16, "learning_rate": 1.9130675452142502e-05, "loss": 1.5522, "step": 5848 }, { "epoch": 0.16, "learning_rate": 1.9130314706998157e-05, "loss": 1.4248, "step": 5849 }, { "epoch": 0.16, "learning_rate": 1.912995389042253e-05, "loss": 1.5913, "step": 5850 }, { "epoch": 0.16, "learning_rate": 1.9129593002418433e-05, "loss": 1.5449, "step": 5851 }, { "epoch": 0.16, "learning_rate": 1.9129232042988698e-05, "loss": 1.4604, "step": 5852 }, { "epoch": 0.16, "learning_rate": 1.9128871012136142e-05, "loss": 1.4233, "step": 5853 }, { "epoch": 0.16, "learning_rate": 1.912850990986359e-05, "loss": 1.834, "step": 5854 }, { "epoch": 0.16, "learning_rate": 1.912814873617387e-05, "loss": 1.3616, "step": 5855 }, { "epoch": 0.16, "learning_rate": 1.912778749106981e-05, "loss": 1.5464, "step": 5856 }, { "epoch": 0.16, "learning_rate": 1.9127426174554226e-05, "loss": 1.4226, "step": 5857 }, { "epoch": 0.16, "learning_rate": 1.9127064786629957e-05, "loss": 1.4946, "step": 5858 }, { "epoch": 0.16, "learning_rate": 1.9126703327299822e-05, "loss": 1.3623, "step": 5859 }, { "epoch": 0.16, "learning_rate": 1.9126341796566655e-05, "loss": 1.2771, "step": 5860 }, { "epoch": 0.16, "learning_rate": 1.912598019443328e-05, "loss": 1.5444, "step": 5861 }, { "epoch": 0.16, "learning_rate": 1.9125618520902526e-05, "loss": 1.3369, "step": 5862 }, { "epoch": 0.16, "learning_rate": 1.9125256775977225e-05, "loss": 1.3901, "step": 5863 }, { "epoch": 0.16, "learning_rate": 1.9124894959660205e-05, "loss": 1.4553, "step": 5864 }, { "epoch": 0.16, "learning_rate": 1.91245330719543e-05, "loss": 1.25, "step": 5865 }, { "epoch": 0.16, "learning_rate": 1.9124171112862335e-05, "loss": 1.4136, "step": 5866 }, { "epoch": 0.16, "learning_rate": 1.9123809082387147e-05, "loss": 1.3506, "step": 5867 }, { "epoch": 0.16, "learning_rate": 1.9123446980531567e-05, "loss": 1.8311, "step": 5868 }, { "epoch": 0.16, "learning_rate": 1.912308480729843e-05, "loss": 1.4504, "step": 5869 }, { "epoch": 0.16, "learning_rate": 1.912272256269057e-05, "loss": 1.4163, "step": 5870 }, { "epoch": 0.16, "learning_rate": 1.9122360246710813e-05, "loss": 1.429, "step": 5871 }, { "epoch": 0.16, "learning_rate": 1.9121997859362e-05, "loss": 1.5479, "step": 5872 }, { "epoch": 0.16, "learning_rate": 1.9121635400646966e-05, "loss": 1.4912, "step": 5873 }, { "epoch": 0.16, "learning_rate": 1.9121272870568547e-05, "loss": 1.4575, "step": 5874 }, { "epoch": 0.16, "learning_rate": 1.9120910269129577e-05, "loss": 1.2893, "step": 5875 }, { "epoch": 0.16, "learning_rate": 1.9120547596332892e-05, "loss": 1.7803, "step": 5876 }, { "epoch": 0.16, "learning_rate": 1.9120184852181335e-05, "loss": 1.4348, "step": 5877 }, { "epoch": 0.16, "learning_rate": 1.911982203667774e-05, "loss": 1.3269, "step": 5878 }, { "epoch": 0.16, "learning_rate": 1.9119459149824943e-05, "loss": 1.4761, "step": 5879 }, { "epoch": 0.16, "learning_rate": 1.911909619162579e-05, "loss": 1.3398, "step": 5880 }, { "epoch": 0.16, "learning_rate": 1.9118733162083113e-05, "loss": 1.2336, "step": 5881 }, { "epoch": 0.16, "learning_rate": 1.9118370061199754e-05, "loss": 1.3486, "step": 5882 }, { "epoch": 0.16, "learning_rate": 1.9118006888978563e-05, "loss": 1.2416, "step": 5883 }, { "epoch": 0.16, "learning_rate": 1.9117643645422367e-05, "loss": 1.3965, "step": 5884 }, { "epoch": 0.16, "learning_rate": 1.9117280330534017e-05, "loss": 1.4517, "step": 5885 }, { "epoch": 0.16, "learning_rate": 1.9116916944316352e-05, "loss": 1.4194, "step": 5886 }, { "epoch": 0.16, "learning_rate": 1.9116553486772217e-05, "loss": 1.4124, "step": 5887 }, { "epoch": 0.16, "learning_rate": 1.9116189957904452e-05, "loss": 1.2046, "step": 5888 }, { "epoch": 0.16, "learning_rate": 1.9115826357715907e-05, "loss": 1.3237, "step": 5889 }, { "epoch": 0.16, "learning_rate": 1.911546268620942e-05, "loss": 1.4563, "step": 5890 }, { "epoch": 0.16, "learning_rate": 1.911509894338784e-05, "loss": 1.2612, "step": 5891 }, { "epoch": 0.16, "learning_rate": 1.9114735129254013e-05, "loss": 1.4307, "step": 5892 }, { "epoch": 0.16, "learning_rate": 1.9114371243810782e-05, "loss": 1.4834, "step": 5893 }, { "epoch": 0.16, "learning_rate": 1.9114007287061e-05, "loss": 1.3809, "step": 5894 }, { "epoch": 0.16, "learning_rate": 1.9113643259007507e-05, "loss": 1.3777, "step": 5895 }, { "epoch": 0.16, "learning_rate": 1.911327915965316e-05, "loss": 1.4163, "step": 5896 }, { "epoch": 0.16, "learning_rate": 1.91129149890008e-05, "loss": 1.3706, "step": 5897 }, { "epoch": 0.16, "learning_rate": 1.9112550747053275e-05, "loss": 1.4741, "step": 5898 }, { "epoch": 0.16, "learning_rate": 1.911218643381344e-05, "loss": 1.5469, "step": 5899 }, { "epoch": 0.16, "learning_rate": 1.9111822049284147e-05, "loss": 1.3772, "step": 5900 }, { "epoch": 0.16, "learning_rate": 1.9111457593468238e-05, "loss": 1.3367, "step": 5901 }, { "epoch": 0.16, "learning_rate": 1.911109306636857e-05, "loss": 1.3845, "step": 5902 }, { "epoch": 0.16, "learning_rate": 1.9110728467987997e-05, "loss": 1.3711, "step": 5903 }, { "epoch": 0.16, "learning_rate": 1.9110363798329364e-05, "loss": 1.3159, "step": 5904 }, { "epoch": 0.16, "learning_rate": 1.910999905739553e-05, "loss": 1.4597, "step": 5905 }, { "epoch": 0.16, "learning_rate": 1.910963424518935e-05, "loss": 1.3694, "step": 5906 }, { "epoch": 0.16, "learning_rate": 1.9109269361713672e-05, "loss": 1.5305, "step": 5907 }, { "epoch": 0.16, "learning_rate": 1.9108904406971356e-05, "loss": 1.4341, "step": 5908 }, { "epoch": 0.16, "learning_rate": 1.9108539380965257e-05, "loss": 1.2483, "step": 5909 }, { "epoch": 0.16, "learning_rate": 1.9108174283698226e-05, "loss": 1.3125, "step": 5910 }, { "epoch": 0.16, "learning_rate": 1.9107809115173125e-05, "loss": 1.4299, "step": 5911 }, { "epoch": 0.16, "learning_rate": 1.9107443875392807e-05, "loss": 1.54, "step": 5912 }, { "epoch": 0.16, "learning_rate": 1.9107078564360128e-05, "loss": 1.3237, "step": 5913 }, { "epoch": 0.16, "learning_rate": 1.9106713182077952e-05, "loss": 1.314, "step": 5914 }, { "epoch": 0.16, "learning_rate": 1.9106347728549134e-05, "loss": 1.3313, "step": 5915 }, { "epoch": 0.16, "learning_rate": 1.9105982203776534e-05, "loss": 1.4712, "step": 5916 }, { "epoch": 0.16, "learning_rate": 1.910561660776301e-05, "loss": 1.377, "step": 5917 }, { "epoch": 0.16, "learning_rate": 1.910525094051142e-05, "loss": 1.3635, "step": 5918 }, { "epoch": 0.16, "learning_rate": 1.9104885202024635e-05, "loss": 1.4038, "step": 5919 }, { "epoch": 0.16, "learning_rate": 1.9104519392305503e-05, "loss": 1.4766, "step": 5920 }, { "epoch": 0.16, "learning_rate": 1.9104153511356898e-05, "loss": 1.4771, "step": 5921 }, { "epoch": 0.16, "learning_rate": 1.9103787559181674e-05, "loss": 1.3982, "step": 5922 }, { "epoch": 0.16, "learning_rate": 1.9103421535782696e-05, "loss": 1.4775, "step": 5923 }, { "epoch": 0.16, "learning_rate": 1.9103055441162833e-05, "loss": 1.5557, "step": 5924 }, { "epoch": 0.16, "learning_rate": 1.9102689275324945e-05, "loss": 1.52, "step": 5925 }, { "epoch": 0.16, "learning_rate": 1.910232303827189e-05, "loss": 1.5251, "step": 5926 }, { "epoch": 0.16, "learning_rate": 1.9101956730006544e-05, "loss": 1.5132, "step": 5927 }, { "epoch": 0.16, "learning_rate": 1.9101590350531767e-05, "loss": 1.3062, "step": 5928 }, { "epoch": 0.16, "learning_rate": 1.910122389985043e-05, "loss": 1.428, "step": 5929 }, { "epoch": 0.16, "learning_rate": 1.9100857377965398e-05, "loss": 1.2976, "step": 5930 }, { "epoch": 0.16, "learning_rate": 1.910049078487953e-05, "loss": 1.3828, "step": 5931 }, { "epoch": 0.16, "learning_rate": 1.9100124120595705e-05, "loss": 1.4553, "step": 5932 }, { "epoch": 0.16, "learning_rate": 1.9099757385116793e-05, "loss": 1.3601, "step": 5933 }, { "epoch": 0.16, "learning_rate": 1.9099390578445652e-05, "loss": 1.425, "step": 5934 }, { "epoch": 0.16, "learning_rate": 1.9099023700585163e-05, "loss": 1.2739, "step": 5935 }, { "epoch": 0.16, "learning_rate": 1.909865675153819e-05, "loss": 1.3728, "step": 5936 }, { "epoch": 0.16, "learning_rate": 1.90982897313076e-05, "loss": 1.4561, "step": 5937 }, { "epoch": 0.16, "learning_rate": 1.9097922639896274e-05, "loss": 1.5454, "step": 5938 }, { "epoch": 0.16, "learning_rate": 1.9097555477307076e-05, "loss": 1.3989, "step": 5939 }, { "epoch": 0.16, "learning_rate": 1.9097188243542885e-05, "loss": 1.2471, "step": 5940 }, { "epoch": 0.16, "learning_rate": 1.909682093860657e-05, "loss": 1.3462, "step": 5941 }, { "epoch": 0.16, "learning_rate": 1.9096453562501008e-05, "loss": 1.3584, "step": 5942 }, { "epoch": 0.16, "learning_rate": 1.9096086115229068e-05, "loss": 1.2947, "step": 5943 }, { "epoch": 0.16, "learning_rate": 1.9095718596793628e-05, "loss": 1.6113, "step": 5944 }, { "epoch": 0.16, "learning_rate": 1.9095351007197564e-05, "loss": 1.4629, "step": 5945 }, { "epoch": 0.16, "learning_rate": 1.9094983346443746e-05, "loss": 1.3677, "step": 5946 }, { "epoch": 0.16, "learning_rate": 1.909461561453506e-05, "loss": 1.5791, "step": 5947 }, { "epoch": 0.16, "learning_rate": 1.9094247811474375e-05, "loss": 1.5591, "step": 5948 }, { "epoch": 0.16, "learning_rate": 1.9093879937264575e-05, "loss": 1.3882, "step": 5949 }, { "epoch": 0.16, "learning_rate": 1.9093511991908534e-05, "loss": 1.4583, "step": 5950 }, { "epoch": 0.16, "learning_rate": 1.9093143975409128e-05, "loss": 1.4116, "step": 5951 }, { "epoch": 0.16, "learning_rate": 1.909277588776924e-05, "loss": 1.3818, "step": 5952 }, { "epoch": 0.16, "learning_rate": 1.9092407728991753e-05, "loss": 1.3892, "step": 5953 }, { "epoch": 0.16, "learning_rate": 1.909203949907954e-05, "loss": 1.4473, "step": 5954 }, { "epoch": 0.16, "learning_rate": 1.9091671198035486e-05, "loss": 1.3701, "step": 5955 }, { "epoch": 0.16, "learning_rate": 1.9091302825862474e-05, "loss": 1.4402, "step": 5956 }, { "epoch": 0.16, "learning_rate": 1.9090934382563383e-05, "loss": 1.4229, "step": 5957 }, { "epoch": 0.16, "learning_rate": 1.9090565868141097e-05, "loss": 1.4368, "step": 5958 }, { "epoch": 0.16, "learning_rate": 1.9090197282598493e-05, "loss": 1.5601, "step": 5959 }, { "epoch": 0.16, "learning_rate": 1.9089828625938464e-05, "loss": 1.4438, "step": 5960 }, { "epoch": 0.16, "learning_rate": 1.908945989816389e-05, "loss": 1.4141, "step": 5961 }, { "epoch": 0.16, "learning_rate": 1.9089091099277657e-05, "loss": 1.3606, "step": 5962 }, { "epoch": 0.16, "learning_rate": 1.9088722229282646e-05, "loss": 1.5078, "step": 5963 }, { "epoch": 0.16, "learning_rate": 1.908835328818175e-05, "loss": 1.4392, "step": 5964 }, { "epoch": 0.16, "learning_rate": 1.908798427597785e-05, "loss": 1.2512, "step": 5965 }, { "epoch": 0.16, "learning_rate": 1.9087615192673833e-05, "loss": 1.3071, "step": 5966 }, { "epoch": 0.16, "learning_rate": 1.908724603827259e-05, "loss": 1.3528, "step": 5967 }, { "epoch": 0.16, "learning_rate": 1.9086876812777003e-05, "loss": 1.4688, "step": 5968 }, { "epoch": 0.16, "learning_rate": 1.9086507516189966e-05, "loss": 1.5791, "step": 5969 }, { "epoch": 0.16, "learning_rate": 1.908613814851437e-05, "loss": 1.4604, "step": 5970 }, { "epoch": 0.16, "learning_rate": 1.9085768709753103e-05, "loss": 1.8657, "step": 5971 }, { "epoch": 0.16, "learning_rate": 1.908539919990905e-05, "loss": 1.3354, "step": 5972 }, { "epoch": 0.16, "learning_rate": 1.908502961898511e-05, "loss": 1.4868, "step": 5973 }, { "epoch": 0.16, "learning_rate": 1.9084659966984164e-05, "loss": 1.2825, "step": 5974 }, { "epoch": 0.16, "learning_rate": 1.9084290243909116e-05, "loss": 1.406, "step": 5975 }, { "epoch": 0.16, "learning_rate": 1.908392044976285e-05, "loss": 1.3533, "step": 5976 }, { "epoch": 0.16, "learning_rate": 1.9083550584548263e-05, "loss": 1.3, "step": 5977 }, { "epoch": 0.16, "learning_rate": 1.908318064826825e-05, "loss": 1.4189, "step": 5978 }, { "epoch": 0.16, "learning_rate": 1.9082810640925698e-05, "loss": 1.4824, "step": 5979 }, { "epoch": 0.16, "learning_rate": 1.908244056252351e-05, "loss": 1.2507, "step": 5980 }, { "epoch": 0.16, "learning_rate": 1.9082070413064574e-05, "loss": 1.3125, "step": 5981 }, { "epoch": 0.16, "learning_rate": 1.9081700192551796e-05, "loss": 1.3867, "step": 5982 }, { "epoch": 0.16, "learning_rate": 1.9081329900988064e-05, "loss": 1.3206, "step": 5983 }, { "epoch": 0.16, "learning_rate": 1.9080959538376276e-05, "loss": 1.3699, "step": 5984 }, { "epoch": 0.16, "learning_rate": 1.908058910471933e-05, "loss": 1.4819, "step": 5985 }, { "epoch": 0.16, "learning_rate": 1.9080218600020125e-05, "loss": 1.4858, "step": 5986 }, { "epoch": 0.16, "learning_rate": 1.907984802428156e-05, "loss": 1.3906, "step": 5987 }, { "epoch": 0.16, "learning_rate": 1.9079477377506535e-05, "loss": 1.2375, "step": 5988 }, { "epoch": 0.16, "learning_rate": 1.9079106659697945e-05, "loss": 1.4937, "step": 5989 }, { "epoch": 0.16, "learning_rate": 1.9078735870858696e-05, "loss": 1.4263, "step": 5990 }, { "epoch": 0.16, "learning_rate": 1.907836501099169e-05, "loss": 1.344, "step": 5991 }, { "epoch": 0.16, "learning_rate": 1.907799408009982e-05, "loss": 1.3435, "step": 5992 }, { "epoch": 0.16, "learning_rate": 1.9077623078185998e-05, "loss": 1.4312, "step": 5993 }, { "epoch": 0.16, "learning_rate": 1.907725200525312e-05, "loss": 1.3228, "step": 5994 }, { "epoch": 0.16, "learning_rate": 1.9076880861304086e-05, "loss": 1.4128, "step": 5995 }, { "epoch": 0.16, "learning_rate": 1.9076509646341806e-05, "loss": 1.1765, "step": 5996 }, { "epoch": 0.16, "learning_rate": 1.9076138360369184e-05, "loss": 1.4307, "step": 5997 }, { "epoch": 0.16, "learning_rate": 1.9075767003389125e-05, "loss": 1.457, "step": 5998 }, { "epoch": 0.16, "learning_rate": 1.907539557540453e-05, "loss": 1.2261, "step": 5999 }, { "epoch": 0.16, "learning_rate": 1.907502407641831e-05, "loss": 1.3713, "step": 6000 }, { "epoch": 0.16, "learning_rate": 1.907465250643337e-05, "loss": 1.4775, "step": 6001 }, { "epoch": 0.16, "learning_rate": 1.9074280865452614e-05, "loss": 1.3201, "step": 6002 }, { "epoch": 0.16, "learning_rate": 1.907390915347895e-05, "loss": 1.4146, "step": 6003 }, { "epoch": 0.16, "learning_rate": 1.907353737051529e-05, "loss": 1.3892, "step": 6004 }, { "epoch": 0.16, "learning_rate": 1.9073165516564537e-05, "loss": 1.2446, "step": 6005 }, { "epoch": 0.16, "learning_rate": 1.907279359162961e-05, "loss": 1.2798, "step": 6006 }, { "epoch": 0.16, "learning_rate": 1.9072421595713404e-05, "loss": 1.23, "step": 6007 }, { "epoch": 0.16, "learning_rate": 1.9072049528818844e-05, "loss": 1.3726, "step": 6008 }, { "epoch": 0.16, "learning_rate": 1.9071677390948832e-05, "loss": 1.3799, "step": 6009 }, { "epoch": 0.16, "learning_rate": 1.907130518210628e-05, "loss": 1.3892, "step": 6010 }, { "epoch": 0.16, "learning_rate": 1.9070932902294107e-05, "loss": 1.2937, "step": 6011 }, { "epoch": 0.16, "learning_rate": 1.9070560551515214e-05, "loss": 1.3091, "step": 6012 }, { "epoch": 0.16, "learning_rate": 1.9070188129772525e-05, "loss": 1.5444, "step": 6013 }, { "epoch": 0.16, "learning_rate": 1.906981563706895e-05, "loss": 1.3921, "step": 6014 }, { "epoch": 0.16, "learning_rate": 1.9069443073407397e-05, "loss": 1.5513, "step": 6015 }, { "epoch": 0.16, "learning_rate": 1.906907043879079e-05, "loss": 1.1677, "step": 6016 }, { "epoch": 0.16, "learning_rate": 1.906869773322204e-05, "loss": 1.2795, "step": 6017 }, { "epoch": 0.16, "learning_rate": 1.9068324956704067e-05, "loss": 1.5117, "step": 6018 }, { "epoch": 0.16, "learning_rate": 1.906795210923978e-05, "loss": 1.4307, "step": 6019 }, { "epoch": 0.16, "learning_rate": 1.90675791908321e-05, "loss": 1.4656, "step": 6020 }, { "epoch": 0.16, "learning_rate": 1.9067206201483943e-05, "loss": 1.459, "step": 6021 }, { "epoch": 0.16, "learning_rate": 1.906683314119823e-05, "loss": 1.4297, "step": 6022 }, { "epoch": 0.16, "learning_rate": 1.9066460009977877e-05, "loss": 1.4971, "step": 6023 }, { "epoch": 0.16, "learning_rate": 1.9066086807825807e-05, "loss": 1.4939, "step": 6024 }, { "epoch": 0.16, "learning_rate": 1.9065713534744935e-05, "loss": 1.4375, "step": 6025 }, { "epoch": 0.16, "learning_rate": 1.906534019073818e-05, "loss": 1.3911, "step": 6026 }, { "epoch": 0.16, "learning_rate": 1.9064966775808472e-05, "loss": 1.4446, "step": 6027 }, { "epoch": 0.16, "learning_rate": 1.9064593289958725e-05, "loss": 1.4614, "step": 6028 }, { "epoch": 0.16, "learning_rate": 1.906421973319186e-05, "loss": 1.3389, "step": 6029 }, { "epoch": 0.16, "learning_rate": 1.9063846105510803e-05, "loss": 1.2852, "step": 6030 }, { "epoch": 0.16, "learning_rate": 1.9063472406918478e-05, "loss": 1.5305, "step": 6031 }, { "epoch": 0.16, "learning_rate": 1.9063098637417804e-05, "loss": 1.4031, "step": 6032 }, { "epoch": 0.16, "learning_rate": 1.906272479701171e-05, "loss": 1.3164, "step": 6033 }, { "epoch": 0.16, "learning_rate": 1.9062350885703117e-05, "loss": 1.4028, "step": 6034 }, { "epoch": 0.16, "learning_rate": 1.9061976903494956e-05, "loss": 1.4548, "step": 6035 }, { "epoch": 0.16, "learning_rate": 1.9061602850390145e-05, "loss": 1.4622, "step": 6036 }, { "epoch": 0.16, "learning_rate": 1.906122872639162e-05, "loss": 1.2761, "step": 6037 }, { "epoch": 0.16, "learning_rate": 1.9060854531502295e-05, "loss": 1.4192, "step": 6038 }, { "epoch": 0.16, "learning_rate": 1.9060480265725108e-05, "loss": 1.24, "step": 6039 }, { "epoch": 0.16, "learning_rate": 1.9060105929062983e-05, "loss": 1.3862, "step": 6040 }, { "epoch": 0.16, "learning_rate": 1.905973152151885e-05, "loss": 1.4915, "step": 6041 }, { "epoch": 0.17, "learning_rate": 1.9059357043095642e-05, "loss": 1.2793, "step": 6042 }, { "epoch": 0.17, "learning_rate": 1.905898249379628e-05, "loss": 1.3809, "step": 6043 }, { "epoch": 0.17, "learning_rate": 1.9058607873623697e-05, "loss": 1.4949, "step": 6044 }, { "epoch": 0.17, "learning_rate": 1.905823318258083e-05, "loss": 1.313, "step": 6045 }, { "epoch": 0.17, "learning_rate": 1.9057858420670607e-05, "loss": 1.384, "step": 6046 }, { "epoch": 0.17, "learning_rate": 1.9057483587895955e-05, "loss": 1.2793, "step": 6047 }, { "epoch": 0.17, "learning_rate": 1.905710868425981e-05, "loss": 1.3503, "step": 6048 }, { "epoch": 0.17, "learning_rate": 1.9056733709765106e-05, "loss": 1.3853, "step": 6049 }, { "epoch": 0.17, "learning_rate": 1.905635866441478e-05, "loss": 1.3491, "step": 6050 }, { "epoch": 0.17, "learning_rate": 1.905598354821176e-05, "loss": 1.4365, "step": 6051 }, { "epoch": 0.17, "learning_rate": 1.9055608361158985e-05, "loss": 1.4668, "step": 6052 }, { "epoch": 0.17, "learning_rate": 1.9055233103259385e-05, "loss": 1.4551, "step": 6053 }, { "epoch": 0.17, "learning_rate": 1.90548577745159e-05, "loss": 1.1768, "step": 6054 }, { "epoch": 0.17, "learning_rate": 1.905448237493147e-05, "loss": 1.3521, "step": 6055 }, { "epoch": 0.17, "learning_rate": 1.9054106904509023e-05, "loss": 1.4021, "step": 6056 }, { "epoch": 0.17, "learning_rate": 1.90537313632515e-05, "loss": 1.3389, "step": 6057 }, { "epoch": 0.17, "learning_rate": 1.9053355751161845e-05, "loss": 1.4021, "step": 6058 }, { "epoch": 0.17, "learning_rate": 1.905298006824299e-05, "loss": 1.2615, "step": 6059 }, { "epoch": 0.17, "learning_rate": 1.9052604314497874e-05, "loss": 1.5063, "step": 6060 }, { "epoch": 0.17, "learning_rate": 1.9052228489929437e-05, "loss": 1.4551, "step": 6061 }, { "epoch": 0.17, "learning_rate": 1.9051852594540627e-05, "loss": 1.4045, "step": 6062 }, { "epoch": 0.17, "learning_rate": 1.9051476628334376e-05, "loss": 1.4192, "step": 6063 }, { "epoch": 0.17, "learning_rate": 1.9051100591313627e-05, "loss": 1.4907, "step": 6064 }, { "epoch": 0.17, "learning_rate": 1.9050724483481323e-05, "loss": 1.4868, "step": 6065 }, { "epoch": 0.17, "learning_rate": 1.905034830484041e-05, "loss": 1.4419, "step": 6066 }, { "epoch": 0.17, "learning_rate": 1.9049972055393823e-05, "loss": 1.3501, "step": 6067 }, { "epoch": 0.17, "learning_rate": 1.9049595735144514e-05, "loss": 1.3403, "step": 6068 }, { "epoch": 0.17, "learning_rate": 1.904921934409542e-05, "loss": 1.4197, "step": 6069 }, { "epoch": 0.17, "learning_rate": 1.9048842882249495e-05, "loss": 1.4263, "step": 6070 }, { "epoch": 0.17, "learning_rate": 1.904846634960967e-05, "loss": 1.7031, "step": 6071 }, { "epoch": 0.17, "learning_rate": 1.9048089746178907e-05, "loss": 1.3711, "step": 6072 }, { "epoch": 0.17, "learning_rate": 1.9047713071960138e-05, "loss": 1.3887, "step": 6073 }, { "epoch": 0.17, "learning_rate": 1.9047336326956322e-05, "loss": 1.345, "step": 6074 }, { "epoch": 0.17, "learning_rate": 1.9046959511170398e-05, "loss": 1.2837, "step": 6075 }, { "epoch": 0.17, "learning_rate": 1.9046582624605316e-05, "loss": 1.5669, "step": 6076 }, { "epoch": 0.17, "learning_rate": 1.904620566726403e-05, "loss": 1.2803, "step": 6077 }, { "epoch": 0.17, "learning_rate": 1.9045828639149476e-05, "loss": 1.4512, "step": 6078 }, { "epoch": 0.17, "learning_rate": 1.9045451540264622e-05, "loss": 1.3894, "step": 6079 }, { "epoch": 0.17, "learning_rate": 1.9045074370612406e-05, "loss": 1.4417, "step": 6080 }, { "epoch": 0.17, "learning_rate": 1.9044697130195777e-05, "loss": 1.4807, "step": 6081 }, { "epoch": 0.17, "learning_rate": 1.9044319819017694e-05, "loss": 1.4631, "step": 6082 }, { "epoch": 0.17, "learning_rate": 1.9043942437081107e-05, "loss": 1.3357, "step": 6083 }, { "epoch": 0.17, "learning_rate": 1.9043564984388965e-05, "loss": 1.4607, "step": 6084 }, { "epoch": 0.17, "learning_rate": 1.9043187460944222e-05, "loss": 1.2791, "step": 6085 }, { "epoch": 0.17, "learning_rate": 1.9042809866749836e-05, "loss": 1.4932, "step": 6086 }, { "epoch": 0.17, "learning_rate": 1.9042432201808757e-05, "loss": 1.4722, "step": 6087 }, { "epoch": 0.17, "learning_rate": 1.9042054466123938e-05, "loss": 1.2856, "step": 6088 }, { "epoch": 0.17, "learning_rate": 1.9041676659698338e-05, "loss": 1.3945, "step": 6089 }, { "epoch": 0.17, "learning_rate": 1.904129878253491e-05, "loss": 1.4529, "step": 6090 }, { "epoch": 0.17, "learning_rate": 1.9040920834636617e-05, "loss": 1.5083, "step": 6091 }, { "epoch": 0.17, "learning_rate": 1.9040542816006408e-05, "loss": 1.5952, "step": 6092 }, { "epoch": 0.17, "learning_rate": 1.9040164726647244e-05, "loss": 1.3721, "step": 6093 }, { "epoch": 0.17, "learning_rate": 1.903978656656208e-05, "loss": 1.2676, "step": 6094 }, { "epoch": 0.17, "learning_rate": 1.9039408335753877e-05, "loss": 1.7007, "step": 6095 }, { "epoch": 0.17, "learning_rate": 1.9039030034225593e-05, "loss": 1.4819, "step": 6096 }, { "epoch": 0.17, "learning_rate": 1.9038651661980193e-05, "loss": 1.3955, "step": 6097 }, { "epoch": 0.17, "learning_rate": 1.9038273219020626e-05, "loss": 1.3074, "step": 6098 }, { "epoch": 0.17, "learning_rate": 1.9037894705349864e-05, "loss": 1.4175, "step": 6099 }, { "epoch": 0.17, "learning_rate": 1.9037516120970863e-05, "loss": 1.6011, "step": 6100 }, { "epoch": 0.17, "learning_rate": 1.9037137465886585e-05, "loss": 1.292, "step": 6101 }, { "epoch": 0.17, "learning_rate": 1.9036758740099993e-05, "loss": 1.3103, "step": 6102 }, { "epoch": 0.17, "learning_rate": 1.903637994361405e-05, "loss": 1.447, "step": 6103 }, { "epoch": 0.17, "learning_rate": 1.903600107643172e-05, "loss": 1.3823, "step": 6104 }, { "epoch": 0.17, "learning_rate": 1.903562213855597e-05, "loss": 1.5762, "step": 6105 }, { "epoch": 0.17, "learning_rate": 1.9035243129989757e-05, "loss": 1.5381, "step": 6106 }, { "epoch": 0.17, "learning_rate": 1.903486405073605e-05, "loss": 1.3757, "step": 6107 }, { "epoch": 0.17, "learning_rate": 1.9034484900797816e-05, "loss": 1.2991, "step": 6108 }, { "epoch": 0.17, "learning_rate": 1.9034105680178022e-05, "loss": 1.1738, "step": 6109 }, { "epoch": 0.17, "learning_rate": 1.903372638887963e-05, "loss": 1.4697, "step": 6110 }, { "epoch": 0.17, "learning_rate": 1.9033347026905617e-05, "loss": 1.481, "step": 6111 }, { "epoch": 0.17, "learning_rate": 1.9032967594258938e-05, "loss": 1.4817, "step": 6112 }, { "epoch": 0.17, "learning_rate": 1.903258809094257e-05, "loss": 1.3701, "step": 6113 }, { "epoch": 0.17, "learning_rate": 1.903220851695948e-05, "loss": 1.4802, "step": 6114 }, { "epoch": 0.17, "learning_rate": 1.903182887231264e-05, "loss": 1.3733, "step": 6115 }, { "epoch": 0.17, "learning_rate": 1.9031449157005017e-05, "loss": 1.1926, "step": 6116 }, { "epoch": 0.17, "learning_rate": 1.903106937103958e-05, "loss": 1.2522, "step": 6117 }, { "epoch": 0.17, "learning_rate": 1.9030689514419305e-05, "loss": 1.5127, "step": 6118 }, { "epoch": 0.17, "learning_rate": 1.9030309587147163e-05, "loss": 1.5571, "step": 6119 }, { "epoch": 0.17, "learning_rate": 1.9029929589226125e-05, "loss": 1.3003, "step": 6120 }, { "epoch": 0.17, "learning_rate": 1.9029549520659164e-05, "loss": 1.4941, "step": 6121 }, { "epoch": 0.17, "learning_rate": 1.902916938144925e-05, "loss": 1.5054, "step": 6122 }, { "epoch": 0.17, "learning_rate": 1.9028789171599364e-05, "loss": 1.4355, "step": 6123 }, { "epoch": 0.17, "learning_rate": 1.902840889111248e-05, "loss": 1.2871, "step": 6124 }, { "epoch": 0.17, "learning_rate": 1.9028028539991562e-05, "loss": 1.3071, "step": 6125 }, { "epoch": 0.17, "learning_rate": 1.90276481182396e-05, "loss": 1.4102, "step": 6126 }, { "epoch": 0.17, "learning_rate": 1.9027267625859563e-05, "loss": 1.3794, "step": 6127 }, { "epoch": 0.17, "learning_rate": 1.902688706285443e-05, "loss": 1.2881, "step": 6128 }, { "epoch": 0.17, "learning_rate": 1.9026506429227174e-05, "loss": 1.4102, "step": 6129 }, { "epoch": 0.17, "learning_rate": 1.902612572498078e-05, "loss": 1.4517, "step": 6130 }, { "epoch": 0.17, "learning_rate": 1.902574495011822e-05, "loss": 1.4233, "step": 6131 }, { "epoch": 0.17, "learning_rate": 1.9025364104642478e-05, "loss": 1.3787, "step": 6132 }, { "epoch": 0.17, "learning_rate": 1.902498318855653e-05, "loss": 1.3999, "step": 6133 }, { "epoch": 0.17, "learning_rate": 1.9024602201863357e-05, "loss": 1.241, "step": 6134 }, { "epoch": 0.17, "learning_rate": 1.9024221144565943e-05, "loss": 1.4353, "step": 6135 }, { "epoch": 0.17, "learning_rate": 1.9023840016667262e-05, "loss": 1.3674, "step": 6136 }, { "epoch": 0.17, "learning_rate": 1.9023458818170303e-05, "loss": 1.4307, "step": 6137 }, { "epoch": 0.17, "learning_rate": 1.9023077549078044e-05, "loss": 1.2744, "step": 6138 }, { "epoch": 0.17, "learning_rate": 1.902269620939347e-05, "loss": 1.3506, "step": 6139 }, { "epoch": 0.17, "learning_rate": 1.902231479911956e-05, "loss": 1.365, "step": 6140 }, { "epoch": 0.17, "learning_rate": 1.9021933318259306e-05, "loss": 1.4368, "step": 6141 }, { "epoch": 0.17, "learning_rate": 1.902155176681569e-05, "loss": 1.3425, "step": 6142 }, { "epoch": 0.17, "learning_rate": 1.9021170144791688e-05, "loss": 1.4502, "step": 6143 }, { "epoch": 0.17, "learning_rate": 1.9020788452190297e-05, "loss": 1.531, "step": 6144 }, { "epoch": 0.17, "learning_rate": 1.90204066890145e-05, "loss": 1.543, "step": 6145 }, { "epoch": 0.17, "learning_rate": 1.902002485526728e-05, "loss": 1.3345, "step": 6146 }, { "epoch": 0.17, "learning_rate": 1.901964295095163e-05, "loss": 1.3684, "step": 6147 }, { "epoch": 0.17, "learning_rate": 1.9019260976070532e-05, "loss": 1.5293, "step": 6148 }, { "epoch": 0.17, "learning_rate": 1.901887893062698e-05, "loss": 1.3257, "step": 6149 }, { "epoch": 0.17, "learning_rate": 1.901849681462396e-05, "loss": 1.4121, "step": 6150 }, { "epoch": 0.17, "learning_rate": 1.9018114628064463e-05, "loss": 1.3853, "step": 6151 }, { "epoch": 0.17, "learning_rate": 1.9017732370951472e-05, "loss": 1.5498, "step": 6152 }, { "epoch": 0.17, "learning_rate": 1.9017350043287987e-05, "loss": 1.304, "step": 6153 }, { "epoch": 0.17, "learning_rate": 1.9016967645076997e-05, "loss": 1.46, "step": 6154 }, { "epoch": 0.17, "learning_rate": 1.9016585176321488e-05, "loss": 1.521, "step": 6155 }, { "epoch": 0.17, "learning_rate": 1.9016202637024462e-05, "loss": 1.2729, "step": 6156 }, { "epoch": 0.17, "learning_rate": 1.9015820027188904e-05, "loss": 1.4604, "step": 6157 }, { "epoch": 0.17, "learning_rate": 1.9015437346817805e-05, "loss": 1.3027, "step": 6158 }, { "epoch": 0.17, "learning_rate": 1.9015054595914168e-05, "loss": 1.5444, "step": 6159 }, { "epoch": 0.17, "learning_rate": 1.9014671774480984e-05, "loss": 1.5073, "step": 6160 }, { "epoch": 0.17, "learning_rate": 1.9014288882521245e-05, "loss": 1.4424, "step": 6161 }, { "epoch": 0.17, "learning_rate": 1.9013905920037953e-05, "loss": 1.5, "step": 6162 }, { "epoch": 0.17, "learning_rate": 1.9013522887034092e-05, "loss": 1.5044, "step": 6163 }, { "epoch": 0.17, "learning_rate": 1.9013139783512672e-05, "loss": 1.1824, "step": 6164 }, { "epoch": 0.17, "learning_rate": 1.9012756609476684e-05, "loss": 1.7036, "step": 6165 }, { "epoch": 0.17, "learning_rate": 1.9012373364929123e-05, "loss": 1.384, "step": 6166 }, { "epoch": 0.17, "learning_rate": 1.901199004987299e-05, "loss": 1.4233, "step": 6167 }, { "epoch": 0.17, "learning_rate": 1.901160666431129e-05, "loss": 1.7334, "step": 6168 }, { "epoch": 0.17, "learning_rate": 1.9011223208247016e-05, "loss": 1.5874, "step": 6169 }, { "epoch": 0.17, "learning_rate": 1.9010839681683166e-05, "loss": 1.3799, "step": 6170 }, { "epoch": 0.17, "learning_rate": 1.901045608462275e-05, "loss": 1.3462, "step": 6171 }, { "epoch": 0.17, "learning_rate": 1.9010072417068753e-05, "loss": 1.4075, "step": 6172 }, { "epoch": 0.17, "learning_rate": 1.900968867902419e-05, "loss": 1.3896, "step": 6173 }, { "epoch": 0.17, "learning_rate": 1.9009304870492062e-05, "loss": 1.4451, "step": 6174 }, { "epoch": 0.17, "learning_rate": 1.9008920991475367e-05, "loss": 1.4951, "step": 6175 }, { "epoch": 0.17, "learning_rate": 1.9008537041977114e-05, "loss": 1.3701, "step": 6176 }, { "epoch": 0.17, "learning_rate": 1.90081530220003e-05, "loss": 1.4556, "step": 6177 }, { "epoch": 0.17, "learning_rate": 1.9007768931547933e-05, "loss": 1.4099, "step": 6178 }, { "epoch": 0.17, "learning_rate": 1.900738477062302e-05, "loss": 1.2222, "step": 6179 }, { "epoch": 0.17, "learning_rate": 1.900700053922856e-05, "loss": 1.2563, "step": 6180 }, { "epoch": 0.17, "learning_rate": 1.9006616237367565e-05, "loss": 1.5366, "step": 6181 }, { "epoch": 0.17, "learning_rate": 1.900623186504304e-05, "loss": 1.2759, "step": 6182 }, { "epoch": 0.17, "learning_rate": 1.900584742225799e-05, "loss": 1.2427, "step": 6183 }, { "epoch": 0.17, "learning_rate": 1.9005462909015426e-05, "loss": 1.4504, "step": 6184 }, { "epoch": 0.17, "learning_rate": 1.9005078325318357e-05, "loss": 1.418, "step": 6185 }, { "epoch": 0.17, "learning_rate": 1.9004693671169787e-05, "loss": 1.2278, "step": 6186 }, { "epoch": 0.17, "learning_rate": 1.9004308946572728e-05, "loss": 1.4573, "step": 6187 }, { "epoch": 0.17, "learning_rate": 1.9003924151530195e-05, "loss": 1.3123, "step": 6188 }, { "epoch": 0.17, "learning_rate": 1.9003539286045186e-05, "loss": 1.5071, "step": 6189 }, { "epoch": 0.17, "learning_rate": 1.9003154350120722e-05, "loss": 1.459, "step": 6190 }, { "epoch": 0.17, "learning_rate": 1.9002769343759813e-05, "loss": 1.2944, "step": 6191 }, { "epoch": 0.17, "learning_rate": 1.9002384266965472e-05, "loss": 1.3668, "step": 6192 }, { "epoch": 0.17, "learning_rate": 1.9001999119740703e-05, "loss": 1.2207, "step": 6193 }, { "epoch": 0.17, "learning_rate": 1.900161390208853e-05, "loss": 1.3555, "step": 6194 }, { "epoch": 0.17, "learning_rate": 1.9001228614011964e-05, "loss": 1.2871, "step": 6195 }, { "epoch": 0.17, "learning_rate": 1.9000843255514018e-05, "loss": 1.4338, "step": 6196 }, { "epoch": 0.17, "learning_rate": 1.9000457826597706e-05, "loss": 1.407, "step": 6197 }, { "epoch": 0.17, "learning_rate": 1.9000072327266044e-05, "loss": 1.1851, "step": 6198 }, { "epoch": 0.17, "learning_rate": 1.8999686757522048e-05, "loss": 1.4312, "step": 6199 }, { "epoch": 0.17, "learning_rate": 1.8999301117368736e-05, "loss": 1.3611, "step": 6200 }, { "epoch": 0.17, "learning_rate": 1.899891540680912e-05, "loss": 1.324, "step": 6201 }, { "epoch": 0.17, "learning_rate": 1.8998529625846225e-05, "loss": 1.3413, "step": 6202 }, { "epoch": 0.17, "learning_rate": 1.8998143774483065e-05, "loss": 1.3057, "step": 6203 }, { "epoch": 0.17, "learning_rate": 1.899775785272266e-05, "loss": 1.3174, "step": 6204 }, { "epoch": 0.17, "learning_rate": 1.899737186056803e-05, "loss": 1.3555, "step": 6205 }, { "epoch": 0.17, "learning_rate": 1.8996985798022188e-05, "loss": 1.3032, "step": 6206 }, { "epoch": 0.17, "learning_rate": 1.8996599665088164e-05, "loss": 1.3384, "step": 6207 }, { "epoch": 0.17, "learning_rate": 1.8996213461768975e-05, "loss": 1.3254, "step": 6208 }, { "epoch": 0.17, "learning_rate": 1.899582718806764e-05, "loss": 1.8613, "step": 6209 }, { "epoch": 0.17, "learning_rate": 1.8995440843987187e-05, "loss": 1.3303, "step": 6210 }, { "epoch": 0.17, "learning_rate": 1.899505442953063e-05, "loss": 1.5071, "step": 6211 }, { "epoch": 0.17, "learning_rate": 1.8994667944701e-05, "loss": 1.4478, "step": 6212 }, { "epoch": 0.17, "learning_rate": 1.8994281389501314e-05, "loss": 1.4048, "step": 6213 }, { "epoch": 0.17, "learning_rate": 1.8993894763934602e-05, "loss": 1.2686, "step": 6214 }, { "epoch": 0.17, "learning_rate": 1.8993508068003887e-05, "loss": 1.4326, "step": 6215 }, { "epoch": 0.17, "learning_rate": 1.8993121301712194e-05, "loss": 1.4741, "step": 6216 }, { "epoch": 0.17, "learning_rate": 1.8992734465062547e-05, "loss": 1.4036, "step": 6217 }, { "epoch": 0.17, "learning_rate": 1.8992347558057977e-05, "loss": 1.2708, "step": 6218 }, { "epoch": 0.17, "learning_rate": 1.8991960580701507e-05, "loss": 1.5613, "step": 6219 }, { "epoch": 0.17, "learning_rate": 1.8991573532996165e-05, "loss": 1.4729, "step": 6220 }, { "epoch": 0.17, "learning_rate": 1.8991186414944982e-05, "loss": 1.5078, "step": 6221 }, { "epoch": 0.17, "learning_rate": 1.899079922655098e-05, "loss": 1.4219, "step": 6222 }, { "epoch": 0.17, "learning_rate": 1.89904119678172e-05, "loss": 1.3716, "step": 6223 }, { "epoch": 0.17, "learning_rate": 1.899002463874666e-05, "loss": 1.4717, "step": 6224 }, { "epoch": 0.17, "learning_rate": 1.8989637239342393e-05, "loss": 1.2837, "step": 6225 }, { "epoch": 0.17, "learning_rate": 1.8989249769607433e-05, "loss": 1.26, "step": 6226 }, { "epoch": 0.17, "learning_rate": 1.898886222954481e-05, "loss": 1.446, "step": 6227 }, { "epoch": 0.17, "learning_rate": 1.8988474619157556e-05, "loss": 1.4128, "step": 6228 }, { "epoch": 0.17, "learning_rate": 1.89880869384487e-05, "loss": 1.3286, "step": 6229 }, { "epoch": 0.17, "learning_rate": 1.8987699187421285e-05, "loss": 1.4688, "step": 6230 }, { "epoch": 0.17, "learning_rate": 1.8987311366078333e-05, "loss": 1.4492, "step": 6231 }, { "epoch": 0.17, "learning_rate": 1.8986923474422885e-05, "loss": 1.2939, "step": 6232 }, { "epoch": 0.17, "learning_rate": 1.898653551245797e-05, "loss": 1.4998, "step": 6233 }, { "epoch": 0.17, "learning_rate": 1.8986147480186633e-05, "loss": 1.7559, "step": 6234 }, { "epoch": 0.17, "learning_rate": 1.8985759377611897e-05, "loss": 1.4919, "step": 6235 }, { "epoch": 0.17, "learning_rate": 1.898537120473681e-05, "loss": 1.458, "step": 6236 }, { "epoch": 0.17, "learning_rate": 1.8984982961564405e-05, "loss": 1.4238, "step": 6237 }, { "epoch": 0.17, "learning_rate": 1.8984594648097713e-05, "loss": 1.249, "step": 6238 }, { "epoch": 0.17, "learning_rate": 1.898420626433978e-05, "loss": 1.2737, "step": 6239 }, { "epoch": 0.17, "learning_rate": 1.8983817810293645e-05, "loss": 1.2368, "step": 6240 }, { "epoch": 0.17, "learning_rate": 1.898342928596234e-05, "loss": 1.2034, "step": 6241 }, { "epoch": 0.17, "learning_rate": 1.898304069134891e-05, "loss": 1.645, "step": 6242 }, { "epoch": 0.17, "learning_rate": 1.8982652026456392e-05, "loss": 1.311, "step": 6243 }, { "epoch": 0.17, "learning_rate": 1.898226329128783e-05, "loss": 1.4126, "step": 6244 }, { "epoch": 0.17, "learning_rate": 1.898187448584626e-05, "loss": 1.375, "step": 6245 }, { "epoch": 0.17, "learning_rate": 1.8981485610134732e-05, "loss": 1.4746, "step": 6246 }, { "epoch": 0.17, "learning_rate": 1.8981096664156284e-05, "loss": 1.5356, "step": 6247 }, { "epoch": 0.17, "learning_rate": 1.898070764791396e-05, "loss": 1.437, "step": 6248 }, { "epoch": 0.17, "learning_rate": 1.89803185614108e-05, "loss": 1.5713, "step": 6249 }, { "epoch": 0.17, "learning_rate": 1.8979929404649852e-05, "loss": 1.2903, "step": 6250 }, { "epoch": 0.17, "learning_rate": 1.8979540177634155e-05, "loss": 1.4155, "step": 6251 }, { "epoch": 0.17, "learning_rate": 1.8979150880366763e-05, "loss": 1.4048, "step": 6252 }, { "epoch": 0.17, "learning_rate": 1.8978761512850713e-05, "loss": 1.449, "step": 6253 }, { "epoch": 0.17, "learning_rate": 1.897837207508906e-05, "loss": 1.4417, "step": 6254 }, { "epoch": 0.17, "learning_rate": 1.897798256708484e-05, "loss": 1.3909, "step": 6255 }, { "epoch": 0.17, "learning_rate": 1.8977592988841107e-05, "loss": 1.5293, "step": 6256 }, { "epoch": 0.17, "learning_rate": 1.897720334036091e-05, "loss": 1.4009, "step": 6257 }, { "epoch": 0.17, "learning_rate": 1.8976813621647295e-05, "loss": 1.3604, "step": 6258 }, { "epoch": 0.17, "learning_rate": 1.897642383270331e-05, "loss": 1.582, "step": 6259 }, { "epoch": 0.17, "learning_rate": 1.8976033973532008e-05, "loss": 1.3005, "step": 6260 }, { "epoch": 0.17, "learning_rate": 1.8975644044136436e-05, "loss": 1.386, "step": 6261 }, { "epoch": 0.17, "learning_rate": 1.8975254044519647e-05, "loss": 1.5264, "step": 6262 }, { "epoch": 0.17, "learning_rate": 1.897486397468469e-05, "loss": 1.4143, "step": 6263 }, { "epoch": 0.17, "learning_rate": 1.8974473834634616e-05, "loss": 1.3105, "step": 6264 }, { "epoch": 0.17, "learning_rate": 1.8974083624372484e-05, "loss": 1.3984, "step": 6265 }, { "epoch": 0.17, "learning_rate": 1.8973693343901335e-05, "loss": 1.4917, "step": 6266 }, { "epoch": 0.17, "learning_rate": 1.8973302993224233e-05, "loss": 1.3013, "step": 6267 }, { "epoch": 0.17, "learning_rate": 1.8972912572344227e-05, "loss": 1.3621, "step": 6268 }, { "epoch": 0.17, "learning_rate": 1.897252208126437e-05, "loss": 1.3171, "step": 6269 }, { "epoch": 0.17, "learning_rate": 1.8972131519987725e-05, "loss": 1.8096, "step": 6270 }, { "epoch": 0.17, "learning_rate": 1.8971740888517337e-05, "loss": 1.4438, "step": 6271 }, { "epoch": 0.17, "learning_rate": 1.897135018685627e-05, "loss": 1.3647, "step": 6272 }, { "epoch": 0.17, "learning_rate": 1.8970959415007577e-05, "loss": 1.3877, "step": 6273 }, { "epoch": 0.17, "learning_rate": 1.8970568572974316e-05, "loss": 1.4443, "step": 6274 }, { "epoch": 0.17, "learning_rate": 1.8970177660759544e-05, "loss": 1.3621, "step": 6275 }, { "epoch": 0.17, "learning_rate": 1.8969786678366317e-05, "loss": 1.3738, "step": 6276 }, { "epoch": 0.17, "learning_rate": 1.89693956257977e-05, "loss": 1.2837, "step": 6277 }, { "epoch": 0.17, "learning_rate": 1.8969004503056752e-05, "loss": 1.418, "step": 6278 }, { "epoch": 0.17, "learning_rate": 1.8968613310146527e-05, "loss": 1.5098, "step": 6279 }, { "epoch": 0.17, "learning_rate": 1.896822204707009e-05, "loss": 1.342, "step": 6280 }, { "epoch": 0.17, "learning_rate": 1.89678307138305e-05, "loss": 1.4368, "step": 6281 }, { "epoch": 0.17, "learning_rate": 1.8967439310430823e-05, "loss": 1.5239, "step": 6282 }, { "epoch": 0.17, "learning_rate": 1.8967047836874114e-05, "loss": 1.4373, "step": 6283 }, { "epoch": 0.17, "learning_rate": 1.8966656293163438e-05, "loss": 1.3582, "step": 6284 }, { "epoch": 0.17, "learning_rate": 1.8966264679301863e-05, "loss": 1.3152, "step": 6285 }, { "epoch": 0.17, "learning_rate": 1.8965872995292445e-05, "loss": 1.1692, "step": 6286 }, { "epoch": 0.17, "learning_rate": 1.8965481241138257e-05, "loss": 1.439, "step": 6287 }, { "epoch": 0.17, "learning_rate": 1.8965089416842358e-05, "loss": 1.2903, "step": 6288 }, { "epoch": 0.17, "learning_rate": 1.8964697522407814e-05, "loss": 1.3762, "step": 6289 }, { "epoch": 0.17, "learning_rate": 1.8964305557837696e-05, "loss": 1.428, "step": 6290 }, { "epoch": 0.17, "learning_rate": 1.8963913523135062e-05, "loss": 1.4924, "step": 6291 }, { "epoch": 0.17, "learning_rate": 1.8963521418302986e-05, "loss": 1.2859, "step": 6292 }, { "epoch": 0.17, "learning_rate": 1.8963129243344533e-05, "loss": 1.365, "step": 6293 }, { "epoch": 0.17, "learning_rate": 1.896273699826277e-05, "loss": 1.283, "step": 6294 }, { "epoch": 0.17, "learning_rate": 1.8962344683060772e-05, "loss": 1.313, "step": 6295 }, { "epoch": 0.17, "learning_rate": 1.89619522977416e-05, "loss": 1.4541, "step": 6296 }, { "epoch": 0.17, "learning_rate": 1.896155984230833e-05, "loss": 1.2971, "step": 6297 }, { "epoch": 0.17, "learning_rate": 1.8961167316764024e-05, "loss": 1.3381, "step": 6298 }, { "epoch": 0.17, "learning_rate": 1.8960774721111764e-05, "loss": 1.543, "step": 6299 }, { "epoch": 0.17, "learning_rate": 1.8960382055354616e-05, "loss": 1.5422, "step": 6300 }, { "epoch": 0.17, "learning_rate": 1.895998931949565e-05, "loss": 1.3201, "step": 6301 }, { "epoch": 0.17, "learning_rate": 1.8959596513537942e-05, "loss": 1.519, "step": 6302 }, { "epoch": 0.17, "learning_rate": 1.8959203637484563e-05, "loss": 1.3062, "step": 6303 }, { "epoch": 0.17, "learning_rate": 1.895881069133859e-05, "loss": 1.385, "step": 6304 }, { "epoch": 0.17, "learning_rate": 1.8958417675103092e-05, "loss": 1.427, "step": 6305 }, { "epoch": 0.17, "learning_rate": 1.895802458878115e-05, "loss": 1.2347, "step": 6306 }, { "epoch": 0.17, "learning_rate": 1.8957631432375833e-05, "loss": 1.46, "step": 6307 }, { "epoch": 0.17, "learning_rate": 1.895723820589022e-05, "loss": 1.4346, "step": 6308 }, { "epoch": 0.17, "learning_rate": 1.8956844909327387e-05, "loss": 1.3865, "step": 6309 }, { "epoch": 0.17, "learning_rate": 1.8956451542690414e-05, "loss": 1.3252, "step": 6310 }, { "epoch": 0.17, "learning_rate": 1.8956058105982373e-05, "loss": 1.4883, "step": 6311 }, { "epoch": 0.17, "learning_rate": 1.8955664599206347e-05, "loss": 1.4744, "step": 6312 }, { "epoch": 0.17, "learning_rate": 1.8955271022365412e-05, "loss": 1.2964, "step": 6313 }, { "epoch": 0.17, "learning_rate": 1.895487737546265e-05, "loss": 1.7412, "step": 6314 }, { "epoch": 0.17, "learning_rate": 1.895448365850113e-05, "loss": 1.3442, "step": 6315 }, { "epoch": 0.17, "learning_rate": 1.8954089871483948e-05, "loss": 1.4409, "step": 6316 }, { "epoch": 0.17, "learning_rate": 1.8953696014414173e-05, "loss": 1.3657, "step": 6317 }, { "epoch": 0.17, "learning_rate": 1.8953302087294893e-05, "loss": 1.2957, "step": 6318 }, { "epoch": 0.17, "learning_rate": 1.895290809012919e-05, "loss": 1.4304, "step": 6319 }, { "epoch": 0.17, "learning_rate": 1.8952514022920143e-05, "loss": 1.7529, "step": 6320 }, { "epoch": 0.17, "learning_rate": 1.8952119885670833e-05, "loss": 1.4355, "step": 6321 }, { "epoch": 0.17, "learning_rate": 1.8951725678384346e-05, "loss": 1.4773, "step": 6322 }, { "epoch": 0.17, "learning_rate": 1.895133140106377e-05, "loss": 1.3042, "step": 6323 }, { "epoch": 0.17, "learning_rate": 1.8950937053712185e-05, "loss": 1.4072, "step": 6324 }, { "epoch": 0.17, "learning_rate": 1.8950542636332677e-05, "loss": 1.3267, "step": 6325 }, { "epoch": 0.17, "learning_rate": 1.8950148148928336e-05, "loss": 1.3367, "step": 6326 }, { "epoch": 0.17, "learning_rate": 1.894975359150224e-05, "loss": 1.4478, "step": 6327 }, { "epoch": 0.17, "learning_rate": 1.894935896405748e-05, "loss": 1.344, "step": 6328 }, { "epoch": 0.17, "learning_rate": 1.8948964266597148e-05, "loss": 1.5791, "step": 6329 }, { "epoch": 0.17, "learning_rate": 1.8948569499124324e-05, "loss": 1.4634, "step": 6330 }, { "epoch": 0.17, "learning_rate": 1.8948174661642102e-05, "loss": 1.4668, "step": 6331 }, { "epoch": 0.17, "learning_rate": 1.894777975415357e-05, "loss": 1.4878, "step": 6332 }, { "epoch": 0.17, "learning_rate": 1.8947384776661813e-05, "loss": 1.4529, "step": 6333 }, { "epoch": 0.17, "learning_rate": 1.894698972916993e-05, "loss": 1.4109, "step": 6334 }, { "epoch": 0.17, "learning_rate": 1.8946594611681e-05, "loss": 1.2737, "step": 6335 }, { "epoch": 0.17, "learning_rate": 1.8946199424198127e-05, "loss": 1.1855, "step": 6336 }, { "epoch": 0.17, "learning_rate": 1.8945804166724394e-05, "loss": 1.4778, "step": 6337 }, { "epoch": 0.17, "learning_rate": 1.8945408839262896e-05, "loss": 1.5002, "step": 6338 }, { "epoch": 0.17, "learning_rate": 1.8945013441816727e-05, "loss": 1.5386, "step": 6339 }, { "epoch": 0.17, "learning_rate": 1.8944617974388974e-05, "loss": 1.3237, "step": 6340 }, { "epoch": 0.17, "learning_rate": 1.8944222436982743e-05, "loss": 1.4531, "step": 6341 }, { "epoch": 0.17, "learning_rate": 1.8943826829601115e-05, "loss": 1.4089, "step": 6342 }, { "epoch": 0.17, "learning_rate": 1.8943431152247197e-05, "loss": 1.394, "step": 6343 }, { "epoch": 0.17, "learning_rate": 1.8943035404924077e-05, "loss": 1.4751, "step": 6344 }, { "epoch": 0.17, "learning_rate": 1.8942639587634854e-05, "loss": 1.3909, "step": 6345 }, { "epoch": 0.17, "learning_rate": 1.894224370038262e-05, "loss": 1.3831, "step": 6346 }, { "epoch": 0.17, "learning_rate": 1.894184774317048e-05, "loss": 1.6096, "step": 6347 }, { "epoch": 0.17, "learning_rate": 1.894145171600153e-05, "loss": 1.3611, "step": 6348 }, { "epoch": 0.17, "learning_rate": 1.8941055618878864e-05, "loss": 1.3127, "step": 6349 }, { "epoch": 0.17, "learning_rate": 1.894065945180558e-05, "loss": 1.4517, "step": 6350 }, { "epoch": 0.17, "learning_rate": 1.8940263214784785e-05, "loss": 1.3645, "step": 6351 }, { "epoch": 0.17, "learning_rate": 1.8939866907819574e-05, "loss": 1.4756, "step": 6352 }, { "epoch": 0.17, "learning_rate": 1.8939470530913047e-05, "loss": 1.3789, "step": 6353 }, { "epoch": 0.17, "learning_rate": 1.8939074084068307e-05, "loss": 1.4307, "step": 6354 }, { "epoch": 0.17, "learning_rate": 1.8938677567288454e-05, "loss": 1.5029, "step": 6355 }, { "epoch": 0.17, "learning_rate": 1.8938280980576592e-05, "loss": 1.3828, "step": 6356 }, { "epoch": 0.17, "learning_rate": 1.893788432393582e-05, "loss": 1.5659, "step": 6357 }, { "epoch": 0.17, "learning_rate": 1.8937487597369245e-05, "loss": 1.2922, "step": 6358 }, { "epoch": 0.17, "learning_rate": 1.893709080087997e-05, "loss": 1.4312, "step": 6359 }, { "epoch": 0.17, "learning_rate": 1.8936693934471103e-05, "loss": 1.5125, "step": 6360 }, { "epoch": 0.17, "learning_rate": 1.893629699814574e-05, "loss": 1.4458, "step": 6361 }, { "epoch": 0.17, "learning_rate": 1.8935899991906993e-05, "loss": 1.5571, "step": 6362 }, { "epoch": 0.17, "learning_rate": 1.893550291575797e-05, "loss": 1.397, "step": 6363 }, { "epoch": 0.17, "learning_rate": 1.8935105769701768e-05, "loss": 1.4841, "step": 6364 }, { "epoch": 0.17, "learning_rate": 1.89347085537415e-05, "loss": 1.2832, "step": 6365 }, { "epoch": 0.17, "learning_rate": 1.8934311267880278e-05, "loss": 1.5391, "step": 6366 }, { "epoch": 0.17, "learning_rate": 1.8933913912121206e-05, "loss": 1.5073, "step": 6367 }, { "epoch": 0.17, "learning_rate": 1.8933516486467388e-05, "loss": 1.4575, "step": 6368 }, { "epoch": 0.17, "learning_rate": 1.893311899092194e-05, "loss": 1.4548, "step": 6369 }, { "epoch": 0.17, "learning_rate": 1.8932721425487973e-05, "loss": 1.3179, "step": 6370 }, { "epoch": 0.17, "learning_rate": 1.893232379016859e-05, "loss": 1.3989, "step": 6371 }, { "epoch": 0.17, "learning_rate": 1.8931926084966907e-05, "loss": 1.3816, "step": 6372 }, { "epoch": 0.17, "learning_rate": 1.8931528309886035e-05, "loss": 1.3411, "step": 6373 }, { "epoch": 0.17, "learning_rate": 1.8931130464929084e-05, "loss": 1.3723, "step": 6374 }, { "epoch": 0.17, "learning_rate": 1.893073255009917e-05, "loss": 1.5181, "step": 6375 }, { "epoch": 0.17, "learning_rate": 1.8930334565399402e-05, "loss": 1.3557, "step": 6376 }, { "epoch": 0.17, "learning_rate": 1.8929936510832897e-05, "loss": 1.4492, "step": 6377 }, { "epoch": 0.17, "learning_rate": 1.892953838640277e-05, "loss": 1.3777, "step": 6378 }, { "epoch": 0.17, "learning_rate": 1.892914019211213e-05, "loss": 1.4695, "step": 6379 }, { "epoch": 0.17, "learning_rate": 1.8928741927964095e-05, "loss": 1.3694, "step": 6380 }, { "epoch": 0.17, "learning_rate": 1.8928343593961784e-05, "loss": 1.2078, "step": 6381 }, { "epoch": 0.17, "learning_rate": 1.8927945190108314e-05, "loss": 1.7471, "step": 6382 }, { "epoch": 0.17, "learning_rate": 1.8927546716406793e-05, "loss": 1.4771, "step": 6383 }, { "epoch": 0.17, "learning_rate": 1.8927148172860348e-05, "loss": 1.4426, "step": 6384 }, { "epoch": 0.17, "learning_rate": 1.8926749559472096e-05, "loss": 1.3408, "step": 6385 }, { "epoch": 0.17, "learning_rate": 1.8926350876245147e-05, "loss": 1.3621, "step": 6386 }, { "epoch": 0.17, "learning_rate": 1.8925952123182633e-05, "loss": 1.4805, "step": 6387 }, { "epoch": 0.17, "learning_rate": 1.892555330028766e-05, "loss": 1.3726, "step": 6388 }, { "epoch": 0.17, "learning_rate": 1.892515440756336e-05, "loss": 1.5156, "step": 6389 }, { "epoch": 0.17, "learning_rate": 1.8924755445012847e-05, "loss": 1.2773, "step": 6390 }, { "epoch": 0.17, "learning_rate": 1.8924356412639243e-05, "loss": 1.5039, "step": 6391 }, { "epoch": 0.17, "learning_rate": 1.8923957310445672e-05, "loss": 1.3809, "step": 6392 }, { "epoch": 0.17, "learning_rate": 1.8923558138435255e-05, "loss": 1.1492, "step": 6393 }, { "epoch": 0.17, "learning_rate": 1.8923158896611114e-05, "loss": 1.3369, "step": 6394 }, { "epoch": 0.17, "learning_rate": 1.892275958497638e-05, "loss": 1.4556, "step": 6395 }, { "epoch": 0.17, "learning_rate": 1.8922360203534164e-05, "loss": 1.3071, "step": 6396 }, { "epoch": 0.17, "learning_rate": 1.89219607522876e-05, "loss": 1.3801, "step": 6397 }, { "epoch": 0.17, "learning_rate": 1.892156123123981e-05, "loss": 1.4243, "step": 6398 }, { "epoch": 0.17, "learning_rate": 1.892116164039392e-05, "loss": 1.3101, "step": 6399 }, { "epoch": 0.17, "learning_rate": 1.8920761979753056e-05, "loss": 1.4104, "step": 6400 }, { "epoch": 0.17, "learning_rate": 1.892036224932035e-05, "loss": 1.3833, "step": 6401 }, { "epoch": 0.17, "learning_rate": 1.891996244909892e-05, "loss": 1.3582, "step": 6402 }, { "epoch": 0.17, "learning_rate": 1.8919562579091896e-05, "loss": 1.4868, "step": 6403 }, { "epoch": 0.17, "learning_rate": 1.891916263930241e-05, "loss": 1.5823, "step": 6404 }, { "epoch": 0.17, "learning_rate": 1.8918762629733592e-05, "loss": 1.4907, "step": 6405 }, { "epoch": 0.17, "learning_rate": 1.891836255038857e-05, "loss": 1.3552, "step": 6406 }, { "epoch": 0.17, "learning_rate": 1.8917962401270468e-05, "loss": 1.3799, "step": 6407 }, { "epoch": 0.17, "learning_rate": 1.8917562182382425e-05, "loss": 1.4819, "step": 6408 }, { "epoch": 0.18, "learning_rate": 1.891716189372757e-05, "loss": 1.4036, "step": 6409 }, { "epoch": 0.18, "learning_rate": 1.8916761535309032e-05, "loss": 1.2405, "step": 6410 }, { "epoch": 0.18, "learning_rate": 1.8916361107129943e-05, "loss": 1.3152, "step": 6411 }, { "epoch": 0.18, "learning_rate": 1.891596060919344e-05, "loss": 1.3525, "step": 6412 }, { "epoch": 0.18, "learning_rate": 1.8915560041502652e-05, "loss": 1.3232, "step": 6413 }, { "epoch": 0.18, "learning_rate": 1.8915159404060716e-05, "loss": 1.6431, "step": 6414 }, { "epoch": 0.18, "learning_rate": 1.8914758696870766e-05, "loss": 1.3076, "step": 6415 }, { "epoch": 0.18, "learning_rate": 1.8914357919935933e-05, "loss": 1.2893, "step": 6416 }, { "epoch": 0.18, "learning_rate": 1.8913957073259356e-05, "loss": 1.4021, "step": 6417 }, { "epoch": 0.18, "learning_rate": 1.8913556156844174e-05, "loss": 1.2646, "step": 6418 }, { "epoch": 0.18, "learning_rate": 1.8913155170693514e-05, "loss": 1.5454, "step": 6419 }, { "epoch": 0.18, "learning_rate": 1.8912754114810522e-05, "loss": 1.1135, "step": 6420 }, { "epoch": 0.18, "learning_rate": 1.8912352989198334e-05, "loss": 1.5288, "step": 6421 }, { "epoch": 0.18, "learning_rate": 1.8911951793860092e-05, "loss": 1.5083, "step": 6422 }, { "epoch": 0.18, "learning_rate": 1.8911550528798922e-05, "loss": 1.5532, "step": 6423 }, { "epoch": 0.18, "learning_rate": 1.8911149194017972e-05, "loss": 1.5552, "step": 6424 }, { "epoch": 0.18, "learning_rate": 1.8910747789520383e-05, "loss": 1.4309, "step": 6425 }, { "epoch": 0.18, "learning_rate": 1.8910346315309292e-05, "loss": 1.3074, "step": 6426 }, { "epoch": 0.18, "learning_rate": 1.8909944771387844e-05, "loss": 1.4175, "step": 6427 }, { "epoch": 0.18, "learning_rate": 1.890954315775918e-05, "loss": 1.5127, "step": 6428 }, { "epoch": 0.18, "learning_rate": 1.8909141474426434e-05, "loss": 1.4097, "step": 6429 }, { "epoch": 0.18, "learning_rate": 1.8908739721392754e-05, "loss": 1.4399, "step": 6430 }, { "epoch": 0.18, "learning_rate": 1.8908337898661287e-05, "loss": 1.5679, "step": 6431 }, { "epoch": 0.18, "learning_rate": 1.8907936006235173e-05, "loss": 1.3906, "step": 6432 }, { "epoch": 0.18, "learning_rate": 1.8907534044117556e-05, "loss": 1.3435, "step": 6433 }, { "epoch": 0.18, "learning_rate": 1.8907132012311585e-05, "loss": 1.2161, "step": 6434 }, { "epoch": 0.18, "learning_rate": 1.8906729910820395e-05, "loss": 1.4568, "step": 6435 }, { "epoch": 0.18, "learning_rate": 1.8906327739647143e-05, "loss": 1.3821, "step": 6436 }, { "epoch": 0.18, "learning_rate": 1.8905925498794968e-05, "loss": 1.3542, "step": 6437 }, { "epoch": 0.18, "learning_rate": 1.890552318826702e-05, "loss": 1.3394, "step": 6438 }, { "epoch": 0.18, "learning_rate": 1.8905120808066448e-05, "loss": 1.3955, "step": 6439 }, { "epoch": 0.18, "learning_rate": 1.8904718358196398e-05, "loss": 1.3628, "step": 6440 }, { "epoch": 0.18, "learning_rate": 1.890431583866002e-05, "loss": 1.3723, "step": 6441 }, { "epoch": 0.18, "learning_rate": 1.890391324946046e-05, "loss": 1.5889, "step": 6442 }, { "epoch": 0.18, "learning_rate": 1.8903510590600868e-05, "loss": 1.3206, "step": 6443 }, { "epoch": 0.18, "learning_rate": 1.89031078620844e-05, "loss": 1.458, "step": 6444 }, { "epoch": 0.18, "learning_rate": 1.8902705063914197e-05, "loss": 1.375, "step": 6445 }, { "epoch": 0.18, "learning_rate": 1.8902302196093422e-05, "loss": 1.45, "step": 6446 }, { "epoch": 0.18, "learning_rate": 1.8901899258625217e-05, "loss": 1.5142, "step": 6447 }, { "epoch": 0.18, "learning_rate": 1.890149625151274e-05, "loss": 1.4004, "step": 6448 }, { "epoch": 0.18, "learning_rate": 1.8901093174759138e-05, "loss": 1.4478, "step": 6449 }, { "epoch": 0.18, "learning_rate": 1.8900690028367577e-05, "loss": 1.3845, "step": 6450 }, { "epoch": 0.18, "learning_rate": 1.8900286812341196e-05, "loss": 1.4895, "step": 6451 }, { "epoch": 0.18, "learning_rate": 1.8899883526683157e-05, "loss": 1.3687, "step": 6452 }, { "epoch": 0.18, "learning_rate": 1.8899480171396615e-05, "loss": 1.5537, "step": 6453 }, { "epoch": 0.18, "learning_rate": 1.8899076746484727e-05, "loss": 1.3696, "step": 6454 }, { "epoch": 0.18, "learning_rate": 1.8898673251950643e-05, "loss": 1.417, "step": 6455 }, { "epoch": 0.18, "learning_rate": 1.889826968779753e-05, "loss": 1.429, "step": 6456 }, { "epoch": 0.18, "learning_rate": 1.8897866054028533e-05, "loss": 1.3264, "step": 6457 }, { "epoch": 0.18, "learning_rate": 1.8897462350646818e-05, "loss": 1.355, "step": 6458 }, { "epoch": 0.18, "learning_rate": 1.889705857765554e-05, "loss": 1.3025, "step": 6459 }, { "epoch": 0.18, "learning_rate": 1.8896654735057864e-05, "loss": 1.4272, "step": 6460 }, { "epoch": 0.18, "learning_rate": 1.889625082285694e-05, "loss": 1.2603, "step": 6461 }, { "epoch": 0.18, "learning_rate": 1.8895846841055936e-05, "loss": 1.3398, "step": 6462 }, { "epoch": 0.18, "learning_rate": 1.889544278965801e-05, "loss": 1.4097, "step": 6463 }, { "epoch": 0.18, "learning_rate": 1.889503866866632e-05, "loss": 1.2112, "step": 6464 }, { "epoch": 0.18, "learning_rate": 1.889463447808403e-05, "loss": 1.7588, "step": 6465 }, { "epoch": 0.18, "learning_rate": 1.8894230217914304e-05, "loss": 1.2744, "step": 6466 }, { "epoch": 0.18, "learning_rate": 1.8893825888160304e-05, "loss": 1.3506, "step": 6467 }, { "epoch": 0.18, "learning_rate": 1.889342148882519e-05, "loss": 1.4175, "step": 6468 }, { "epoch": 0.18, "learning_rate": 1.889301701991213e-05, "loss": 1.3662, "step": 6469 }, { "epoch": 0.18, "learning_rate": 1.8892612481424286e-05, "loss": 1.4014, "step": 6470 }, { "epoch": 0.18, "learning_rate": 1.8892207873364824e-05, "loss": 1.2322, "step": 6471 }, { "epoch": 0.18, "learning_rate": 1.889180319573691e-05, "loss": 1.4839, "step": 6472 }, { "epoch": 0.18, "learning_rate": 1.8891398448543707e-05, "loss": 1.4121, "step": 6473 }, { "epoch": 0.18, "learning_rate": 1.8890993631788384e-05, "loss": 1.4128, "step": 6474 }, { "epoch": 0.18, "learning_rate": 1.8890588745474106e-05, "loss": 1.4619, "step": 6475 }, { "epoch": 0.18, "learning_rate": 1.8890183789604047e-05, "loss": 1.5676, "step": 6476 }, { "epoch": 0.18, "learning_rate": 1.8889778764181365e-05, "loss": 1.3477, "step": 6477 }, { "epoch": 0.18, "learning_rate": 1.8889373669209237e-05, "loss": 1.5195, "step": 6478 }, { "epoch": 0.18, "learning_rate": 1.888896850469083e-05, "loss": 1.3418, "step": 6479 }, { "epoch": 0.18, "learning_rate": 1.8888563270629313e-05, "loss": 1.3818, "step": 6480 }, { "epoch": 0.18, "learning_rate": 1.8888157967027855e-05, "loss": 1.4214, "step": 6481 }, { "epoch": 0.18, "learning_rate": 1.8887752593889634e-05, "loss": 1.2759, "step": 6482 }, { "epoch": 0.18, "learning_rate": 1.888734715121781e-05, "loss": 1.3989, "step": 6483 }, { "epoch": 0.18, "learning_rate": 1.8886941639015563e-05, "loss": 1.2612, "step": 6484 }, { "epoch": 0.18, "learning_rate": 1.8886536057286063e-05, "loss": 1.407, "step": 6485 }, { "epoch": 0.18, "learning_rate": 1.8886130406032484e-05, "loss": 1.2852, "step": 6486 }, { "epoch": 0.18, "learning_rate": 1.8885724685258e-05, "loss": 1.2986, "step": 6487 }, { "epoch": 0.18, "learning_rate": 1.8885318894965782e-05, "loss": 1.3394, "step": 6488 }, { "epoch": 0.18, "learning_rate": 1.8884913035159008e-05, "loss": 1.3088, "step": 6489 }, { "epoch": 0.18, "learning_rate": 1.8884507105840854e-05, "loss": 1.4062, "step": 6490 }, { "epoch": 0.18, "learning_rate": 1.8884101107014495e-05, "loss": 1.2214, "step": 6491 }, { "epoch": 0.18, "learning_rate": 1.8883695038683103e-05, "loss": 1.4336, "step": 6492 }, { "epoch": 0.18, "learning_rate": 1.8883288900849863e-05, "loss": 1.3445, "step": 6493 }, { "epoch": 0.18, "learning_rate": 1.8882882693517945e-05, "loss": 1.4556, "step": 6494 }, { "epoch": 0.18, "learning_rate": 1.888247641669053e-05, "loss": 1.6675, "step": 6495 }, { "epoch": 0.18, "learning_rate": 1.8882070070370794e-05, "loss": 1.3047, "step": 6496 }, { "epoch": 0.18, "learning_rate": 1.8881663654561923e-05, "loss": 1.4839, "step": 6497 }, { "epoch": 0.18, "learning_rate": 1.8881257169267087e-05, "loss": 1.2534, "step": 6498 }, { "epoch": 0.18, "learning_rate": 1.8880850614489478e-05, "loss": 1.511, "step": 6499 }, { "epoch": 0.18, "learning_rate": 1.8880443990232263e-05, "loss": 1.3696, "step": 6500 }, { "epoch": 0.18, "learning_rate": 1.8880037296498635e-05, "loss": 1.4458, "step": 6501 }, { "epoch": 0.18, "learning_rate": 1.8879630533291767e-05, "loss": 1.3635, "step": 6502 }, { "epoch": 0.18, "learning_rate": 1.887922370061485e-05, "loss": 1.2288, "step": 6503 }, { "epoch": 0.18, "learning_rate": 1.8878816798471058e-05, "loss": 1.3955, "step": 6504 }, { "epoch": 0.18, "learning_rate": 1.8878409826863578e-05, "loss": 1.2358, "step": 6505 }, { "epoch": 0.18, "learning_rate": 1.88780027857956e-05, "loss": 1.5103, "step": 6506 }, { "epoch": 0.18, "learning_rate": 1.88775956752703e-05, "loss": 1.3965, "step": 6507 }, { "epoch": 0.18, "learning_rate": 1.8877188495290864e-05, "loss": 1.4521, "step": 6508 }, { "epoch": 0.18, "learning_rate": 1.8876781245860478e-05, "loss": 1.4668, "step": 6509 }, { "epoch": 0.18, "learning_rate": 1.8876373926982334e-05, "loss": 1.3691, "step": 6510 }, { "epoch": 0.18, "learning_rate": 1.8875966538659612e-05, "loss": 1.218, "step": 6511 }, { "epoch": 0.18, "learning_rate": 1.8875559080895503e-05, "loss": 1.29, "step": 6512 }, { "epoch": 0.18, "learning_rate": 1.887515155369319e-05, "loss": 1.3708, "step": 6513 }, { "epoch": 0.18, "learning_rate": 1.8874743957055868e-05, "loss": 1.4272, "step": 6514 }, { "epoch": 0.18, "learning_rate": 1.8874336290986722e-05, "loss": 1.3896, "step": 6515 }, { "epoch": 0.18, "learning_rate": 1.8873928555488942e-05, "loss": 1.4678, "step": 6516 }, { "epoch": 0.18, "learning_rate": 1.8873520750565716e-05, "loss": 1.3672, "step": 6517 }, { "epoch": 0.18, "learning_rate": 1.887311287622024e-05, "loss": 1.3438, "step": 6518 }, { "epoch": 0.18, "learning_rate": 1.88727049324557e-05, "loss": 1.387, "step": 6519 }, { "epoch": 0.18, "learning_rate": 1.8872296919275287e-05, "loss": 1.4329, "step": 6520 }, { "epoch": 0.18, "learning_rate": 1.8871888836682196e-05, "loss": 1.1348, "step": 6521 }, { "epoch": 0.18, "learning_rate": 1.8871480684679617e-05, "loss": 1.2346, "step": 6522 }, { "epoch": 0.18, "learning_rate": 1.887107246327075e-05, "loss": 1.5364, "step": 6523 }, { "epoch": 0.18, "learning_rate": 1.8870664172458775e-05, "loss": 1.5293, "step": 6524 }, { "epoch": 0.18, "learning_rate": 1.8870255812246898e-05, "loss": 1.4912, "step": 6525 }, { "epoch": 0.18, "learning_rate": 1.8869847382638313e-05, "loss": 1.877, "step": 6526 }, { "epoch": 0.18, "learning_rate": 1.8869438883636212e-05, "loss": 1.2893, "step": 6527 }, { "epoch": 0.18, "learning_rate": 1.8869030315243793e-05, "loss": 1.4678, "step": 6528 }, { "epoch": 0.18, "learning_rate": 1.886862167746425e-05, "loss": 1.2749, "step": 6529 }, { "epoch": 0.18, "learning_rate": 1.886821297030078e-05, "loss": 1.4033, "step": 6530 }, { "epoch": 0.18, "learning_rate": 1.8867804193756585e-05, "loss": 1.4155, "step": 6531 }, { "epoch": 0.18, "learning_rate": 1.8867395347834857e-05, "loss": 1.4023, "step": 6532 }, { "epoch": 0.18, "learning_rate": 1.88669864325388e-05, "loss": 1.4888, "step": 6533 }, { "epoch": 0.18, "learning_rate": 1.886657744787161e-05, "loss": 1.408, "step": 6534 }, { "epoch": 0.18, "learning_rate": 1.8866168393836485e-05, "loss": 1.438, "step": 6535 }, { "epoch": 0.18, "learning_rate": 1.886575927043663e-05, "loss": 1.3069, "step": 6536 }, { "epoch": 0.18, "learning_rate": 1.8865350077675243e-05, "loss": 1.4233, "step": 6537 }, { "epoch": 0.18, "learning_rate": 1.8864940815555525e-05, "loss": 1.4158, "step": 6538 }, { "epoch": 0.18, "learning_rate": 1.886453148408068e-05, "loss": 1.4993, "step": 6539 }, { "epoch": 0.18, "learning_rate": 1.8864122083253908e-05, "loss": 1.3442, "step": 6540 }, { "epoch": 0.18, "learning_rate": 1.8863712613078415e-05, "loss": 1.355, "step": 6541 }, { "epoch": 0.18, "learning_rate": 1.8863303073557403e-05, "loss": 1.4023, "step": 6542 }, { "epoch": 0.18, "learning_rate": 1.8862893464694072e-05, "loss": 1.5879, "step": 6543 }, { "epoch": 0.18, "learning_rate": 1.886248378649163e-05, "loss": 1.2261, "step": 6544 }, { "epoch": 0.18, "learning_rate": 1.8862074038953286e-05, "loss": 1.3157, "step": 6545 }, { "epoch": 0.18, "learning_rate": 1.8861664222082238e-05, "loss": 1.4302, "step": 6546 }, { "epoch": 0.18, "learning_rate": 1.88612543358817e-05, "loss": 1.2996, "step": 6547 }, { "epoch": 0.18, "learning_rate": 1.886084438035487e-05, "loss": 1.3591, "step": 6548 }, { "epoch": 0.18, "learning_rate": 1.8860434355504966e-05, "loss": 1.4106, "step": 6549 }, { "epoch": 0.18, "learning_rate": 1.886002426133519e-05, "loss": 1.8008, "step": 6550 }, { "epoch": 0.18, "learning_rate": 1.8859614097848748e-05, "loss": 1.3755, "step": 6551 }, { "epoch": 0.18, "learning_rate": 1.885920386504885e-05, "loss": 1.5166, "step": 6552 }, { "epoch": 0.18, "learning_rate": 1.8858793562938707e-05, "loss": 1.3123, "step": 6553 }, { "epoch": 0.18, "learning_rate": 1.885838319152153e-05, "loss": 1.4094, "step": 6554 }, { "epoch": 0.18, "learning_rate": 1.885797275080053e-05, "loss": 1.5027, "step": 6555 }, { "epoch": 0.18, "learning_rate": 1.8857562240778914e-05, "loss": 1.4033, "step": 6556 }, { "epoch": 0.18, "learning_rate": 1.8857151661459896e-05, "loss": 1.1963, "step": 6557 }, { "epoch": 0.18, "learning_rate": 1.8856741012846692e-05, "loss": 1.4375, "step": 6558 }, { "epoch": 0.18, "learning_rate": 1.8856330294942506e-05, "loss": 1.2498, "step": 6559 }, { "epoch": 0.18, "learning_rate": 1.885591950775056e-05, "loss": 1.4067, "step": 6560 }, { "epoch": 0.18, "learning_rate": 1.8855508651274063e-05, "loss": 1.3245, "step": 6561 }, { "epoch": 0.18, "learning_rate": 1.885509772551623e-05, "loss": 1.416, "step": 6562 }, { "epoch": 0.18, "learning_rate": 1.8854686730480274e-05, "loss": 1.3152, "step": 6563 }, { "epoch": 0.18, "learning_rate": 1.8854275666169416e-05, "loss": 1.5034, "step": 6564 }, { "epoch": 0.18, "learning_rate": 1.885386453258687e-05, "loss": 1.3848, "step": 6565 }, { "epoch": 0.18, "learning_rate": 1.885345332973585e-05, "loss": 1.4138, "step": 6566 }, { "epoch": 0.18, "learning_rate": 1.8853042057619574e-05, "loss": 1.4702, "step": 6567 }, { "epoch": 0.18, "learning_rate": 1.8852630716241257e-05, "loss": 1.375, "step": 6568 }, { "epoch": 0.18, "learning_rate": 1.8852219305604125e-05, "loss": 1.3875, "step": 6569 }, { "epoch": 0.18, "learning_rate": 1.8851807825711387e-05, "loss": 1.5342, "step": 6570 }, { "epoch": 0.18, "learning_rate": 1.8851396276566272e-05, "loss": 1.3374, "step": 6571 }, { "epoch": 0.18, "learning_rate": 1.8850984658171992e-05, "loss": 1.5791, "step": 6572 }, { "epoch": 0.18, "learning_rate": 1.885057297053177e-05, "loss": 1.4795, "step": 6573 }, { "epoch": 0.18, "learning_rate": 1.885016121364883e-05, "loss": 1.4648, "step": 6574 }, { "epoch": 0.18, "learning_rate": 1.8849749387526387e-05, "loss": 1.3232, "step": 6575 }, { "epoch": 0.18, "learning_rate": 1.8849337492167664e-05, "loss": 1.6641, "step": 6576 }, { "epoch": 0.18, "learning_rate": 1.884892552757589e-05, "loss": 1.3074, "step": 6577 }, { "epoch": 0.18, "learning_rate": 1.8848513493754282e-05, "loss": 1.3538, "step": 6578 }, { "epoch": 0.18, "learning_rate": 1.8848101390706066e-05, "loss": 1.4104, "step": 6579 }, { "epoch": 0.18, "learning_rate": 1.8847689218434465e-05, "loss": 1.3298, "step": 6580 }, { "epoch": 0.18, "learning_rate": 1.8847276976942705e-05, "loss": 1.3608, "step": 6581 }, { "epoch": 0.18, "learning_rate": 1.8846864666234008e-05, "loss": 1.4373, "step": 6582 }, { "epoch": 0.18, "learning_rate": 1.8846452286311602e-05, "loss": 1.5444, "step": 6583 }, { "epoch": 0.18, "learning_rate": 1.8846039837178717e-05, "loss": 1.1938, "step": 6584 }, { "epoch": 0.18, "learning_rate": 1.8845627318838572e-05, "loss": 1.3125, "step": 6585 }, { "epoch": 0.18, "learning_rate": 1.8845214731294398e-05, "loss": 1.4929, "step": 6586 }, { "epoch": 0.18, "learning_rate": 1.8844802074549428e-05, "loss": 1.1919, "step": 6587 }, { "epoch": 0.18, "learning_rate": 1.884438934860688e-05, "loss": 1.2583, "step": 6588 }, { "epoch": 0.18, "learning_rate": 1.8843976553469995e-05, "loss": 1.5681, "step": 6589 }, { "epoch": 0.18, "learning_rate": 1.8843563689141987e-05, "loss": 1.438, "step": 6590 }, { "epoch": 0.18, "learning_rate": 1.8843150755626104e-05, "loss": 1.4253, "step": 6591 }, { "epoch": 0.18, "learning_rate": 1.8842737752925564e-05, "loss": 1.4521, "step": 6592 }, { "epoch": 0.18, "learning_rate": 1.8842324681043604e-05, "loss": 1.2371, "step": 6593 }, { "epoch": 0.18, "learning_rate": 1.884191153998345e-05, "loss": 1.4575, "step": 6594 }, { "epoch": 0.18, "learning_rate": 1.884149832974834e-05, "loss": 1.3828, "step": 6595 }, { "epoch": 0.18, "learning_rate": 1.8841085050341506e-05, "loss": 1.356, "step": 6596 }, { "epoch": 0.18, "learning_rate": 1.8840671701766178e-05, "loss": 1.4407, "step": 6597 }, { "epoch": 0.18, "learning_rate": 1.8840258284025592e-05, "loss": 1.2781, "step": 6598 }, { "epoch": 0.18, "learning_rate": 1.8839844797122983e-05, "loss": 1.4561, "step": 6599 }, { "epoch": 0.18, "learning_rate": 1.8839431241061585e-05, "loss": 1.3779, "step": 6600 }, { "epoch": 0.18, "learning_rate": 1.8839017615844635e-05, "loss": 1.3997, "step": 6601 }, { "epoch": 0.18, "learning_rate": 1.8838603921475364e-05, "loss": 1.3848, "step": 6602 }, { "epoch": 0.18, "learning_rate": 1.8838190157957013e-05, "loss": 1.3524, "step": 6603 }, { "epoch": 0.18, "learning_rate": 1.883777632529282e-05, "loss": 1.4277, "step": 6604 }, { "epoch": 0.18, "learning_rate": 1.883736242348602e-05, "loss": 1.397, "step": 6605 }, { "epoch": 0.18, "learning_rate": 1.883694845253985e-05, "loss": 1.2151, "step": 6606 }, { "epoch": 0.18, "learning_rate": 1.8836534412457555e-05, "loss": 1.387, "step": 6607 }, { "epoch": 0.18, "learning_rate": 1.8836120303242368e-05, "loss": 1.3677, "step": 6608 }, { "epoch": 0.18, "learning_rate": 1.8835706124897532e-05, "loss": 1.3579, "step": 6609 }, { "epoch": 0.18, "learning_rate": 1.8835291877426283e-05, "loss": 1.5034, "step": 6610 }, { "epoch": 0.18, "learning_rate": 1.8834877560831867e-05, "loss": 1.3826, "step": 6611 }, { "epoch": 0.18, "learning_rate": 1.8834463175117522e-05, "loss": 1.4082, "step": 6612 }, { "epoch": 0.18, "learning_rate": 1.8834048720286492e-05, "loss": 1.5303, "step": 6613 }, { "epoch": 0.18, "learning_rate": 1.883363419634202e-05, "loss": 1.3501, "step": 6614 }, { "epoch": 0.18, "learning_rate": 1.8833219603287348e-05, "loss": 1.3306, "step": 6615 }, { "epoch": 0.18, "learning_rate": 1.883280494112572e-05, "loss": 1.3447, "step": 6616 }, { "epoch": 0.18, "learning_rate": 1.8832390209860377e-05, "loss": 1.2712, "step": 6617 }, { "epoch": 0.18, "learning_rate": 1.883197540949457e-05, "loss": 1.4541, "step": 6618 }, { "epoch": 0.18, "learning_rate": 1.8831560540031536e-05, "loss": 1.4092, "step": 6619 }, { "epoch": 0.18, "learning_rate": 1.8831145601474525e-05, "loss": 1.5229, "step": 6620 }, { "epoch": 0.18, "learning_rate": 1.8830730593826787e-05, "loss": 1.3357, "step": 6621 }, { "epoch": 0.18, "learning_rate": 1.8830315517091564e-05, "loss": 1.4771, "step": 6622 }, { "epoch": 0.18, "learning_rate": 1.8829900371272106e-05, "loss": 1.4912, "step": 6623 }, { "epoch": 0.18, "learning_rate": 1.882948515637166e-05, "loss": 1.3262, "step": 6624 }, { "epoch": 0.18, "learning_rate": 1.882906987239347e-05, "loss": 1.4297, "step": 6625 }, { "epoch": 0.18, "learning_rate": 1.882865451934079e-05, "loss": 1.3757, "step": 6626 }, { "epoch": 0.18, "learning_rate": 1.8828239097216872e-05, "loss": 1.4229, "step": 6627 }, { "epoch": 0.18, "learning_rate": 1.882782360602496e-05, "loss": 1.3879, "step": 6628 }, { "epoch": 0.18, "learning_rate": 1.8827408045768308e-05, "loss": 1.416, "step": 6629 }, { "epoch": 0.18, "learning_rate": 1.8826992416450168e-05, "loss": 1.5186, "step": 6630 }, { "epoch": 0.18, "learning_rate": 1.882657671807379e-05, "loss": 1.322, "step": 6631 }, { "epoch": 0.18, "learning_rate": 1.8826160950642424e-05, "loss": 1.2104, "step": 6632 }, { "epoch": 0.18, "learning_rate": 1.8825745114159324e-05, "loss": 1.3918, "step": 6633 }, { "epoch": 0.18, "learning_rate": 1.8825329208627745e-05, "loss": 1.5005, "step": 6634 }, { "epoch": 0.18, "learning_rate": 1.8824913234050943e-05, "loss": 1.3916, "step": 6635 }, { "epoch": 0.18, "learning_rate": 1.8824497190432167e-05, "loss": 1.2847, "step": 6636 }, { "epoch": 0.18, "learning_rate": 1.8824081077774677e-05, "loss": 1.4316, "step": 6637 }, { "epoch": 0.18, "learning_rate": 1.8823664896081724e-05, "loss": 1.3438, "step": 6638 }, { "epoch": 0.18, "learning_rate": 1.8823248645356565e-05, "loss": 1.3789, "step": 6639 }, { "epoch": 0.18, "learning_rate": 1.882283232560246e-05, "loss": 1.502, "step": 6640 }, { "epoch": 0.18, "learning_rate": 1.8822415936822664e-05, "loss": 1.1692, "step": 6641 }, { "epoch": 0.18, "learning_rate": 1.8821999479020433e-05, "loss": 1.2361, "step": 6642 }, { "epoch": 0.18, "learning_rate": 1.8821582952199027e-05, "loss": 1.3904, "step": 6643 }, { "epoch": 0.18, "learning_rate": 1.8821166356361705e-05, "loss": 1.3447, "step": 6644 }, { "epoch": 0.18, "learning_rate": 1.8820749691511723e-05, "loss": 1.4902, "step": 6645 }, { "epoch": 0.18, "learning_rate": 1.8820332957652344e-05, "loss": 1.3784, "step": 6646 }, { "epoch": 0.18, "learning_rate": 1.881991615478683e-05, "loss": 1.324, "step": 6647 }, { "epoch": 0.18, "learning_rate": 1.8819499282918436e-05, "loss": 1.5034, "step": 6648 }, { "epoch": 0.18, "learning_rate": 1.881908234205043e-05, "loss": 1.52, "step": 6649 }, { "epoch": 0.18, "learning_rate": 1.881866533218607e-05, "loss": 1.3989, "step": 6650 }, { "epoch": 0.18, "learning_rate": 1.881824825332862e-05, "loss": 1.5249, "step": 6651 }, { "epoch": 0.18, "learning_rate": 1.8817831105481338e-05, "loss": 1.4912, "step": 6652 }, { "epoch": 0.18, "learning_rate": 1.8817413888647492e-05, "loss": 1.4395, "step": 6653 }, { "epoch": 0.18, "learning_rate": 1.881699660283035e-05, "loss": 1.3315, "step": 6654 }, { "epoch": 0.18, "learning_rate": 1.881657924803317e-05, "loss": 1.314, "step": 6655 }, { "epoch": 0.18, "learning_rate": 1.8816161824259224e-05, "loss": 1.3328, "step": 6656 }, { "epoch": 0.18, "learning_rate": 1.881574433151177e-05, "loss": 1.4019, "step": 6657 }, { "epoch": 0.18, "learning_rate": 1.8815326769794077e-05, "loss": 1.3093, "step": 6658 }, { "epoch": 0.18, "learning_rate": 1.8814909139109413e-05, "loss": 1.498, "step": 6659 }, { "epoch": 0.18, "learning_rate": 1.8814491439461045e-05, "loss": 1.3765, "step": 6660 }, { "epoch": 0.18, "learning_rate": 1.8814073670852245e-05, "loss": 1.4236, "step": 6661 }, { "epoch": 0.18, "learning_rate": 1.8813655833286273e-05, "loss": 1.4111, "step": 6662 }, { "epoch": 0.18, "learning_rate": 1.8813237926766404e-05, "loss": 1.3035, "step": 6663 }, { "epoch": 0.18, "learning_rate": 1.8812819951295906e-05, "loss": 1.3403, "step": 6664 }, { "epoch": 0.18, "learning_rate": 1.8812401906878043e-05, "loss": 1.3682, "step": 6665 }, { "epoch": 0.18, "learning_rate": 1.8811983793516097e-05, "loss": 1.2812, "step": 6666 }, { "epoch": 0.18, "learning_rate": 1.8811565611213332e-05, "loss": 1.3474, "step": 6667 }, { "epoch": 0.18, "learning_rate": 1.8811147359973026e-05, "loss": 1.4192, "step": 6668 }, { "epoch": 0.18, "learning_rate": 1.881072903979844e-05, "loss": 1.3909, "step": 6669 }, { "epoch": 0.18, "learning_rate": 1.8810310650692857e-05, "loss": 1.356, "step": 6670 }, { "epoch": 0.18, "learning_rate": 1.8809892192659544e-05, "loss": 1.4268, "step": 6671 }, { "epoch": 0.18, "learning_rate": 1.8809473665701777e-05, "loss": 1.439, "step": 6672 }, { "epoch": 0.18, "learning_rate": 1.880905506982283e-05, "loss": 1.2441, "step": 6673 }, { "epoch": 0.18, "learning_rate": 1.8808636405025978e-05, "loss": 1.5427, "step": 6674 }, { "epoch": 0.18, "learning_rate": 1.8808217671314503e-05, "loss": 1.4084, "step": 6675 }, { "epoch": 0.18, "learning_rate": 1.880779886869167e-05, "loss": 1.4092, "step": 6676 }, { "epoch": 0.18, "learning_rate": 1.880737999716076e-05, "loss": 1.7886, "step": 6677 }, { "epoch": 0.18, "learning_rate": 1.880696105672505e-05, "loss": 1.2158, "step": 6678 }, { "epoch": 0.18, "learning_rate": 1.880654204738782e-05, "loss": 1.5063, "step": 6679 }, { "epoch": 0.18, "learning_rate": 1.8806122969152347e-05, "loss": 1.4241, "step": 6680 }, { "epoch": 0.18, "learning_rate": 1.8805703822021904e-05, "loss": 1.3074, "step": 6681 }, { "epoch": 0.18, "learning_rate": 1.880528460599978e-05, "loss": 1.5068, "step": 6682 }, { "epoch": 0.18, "learning_rate": 1.8804865321089246e-05, "loss": 1.3442, "step": 6683 }, { "epoch": 0.18, "learning_rate": 1.880444596729359e-05, "loss": 1.4153, "step": 6684 }, { "epoch": 0.18, "learning_rate": 1.880402654461609e-05, "loss": 1.3794, "step": 6685 }, { "epoch": 0.18, "learning_rate": 1.880360705306002e-05, "loss": 1.4785, "step": 6686 }, { "epoch": 0.18, "learning_rate": 1.880318749262867e-05, "loss": 1.3796, "step": 6687 }, { "epoch": 0.18, "learning_rate": 1.8802767863325323e-05, "loss": 1.2769, "step": 6688 }, { "epoch": 0.18, "learning_rate": 1.880234816515326e-05, "loss": 1.5391, "step": 6689 }, { "epoch": 0.18, "learning_rate": 1.880192839811576e-05, "loss": 1.4094, "step": 6690 }, { "epoch": 0.18, "learning_rate": 1.8801508562216114e-05, "loss": 1.4822, "step": 6691 }, { "epoch": 0.18, "learning_rate": 1.8801088657457605e-05, "loss": 1.3994, "step": 6692 }, { "epoch": 0.18, "learning_rate": 1.8800668683843515e-05, "loss": 1.4707, "step": 6693 }, { "epoch": 0.18, "learning_rate": 1.8800248641377134e-05, "loss": 1.1853, "step": 6694 }, { "epoch": 0.18, "learning_rate": 1.8799828530061742e-05, "loss": 1.4639, "step": 6695 }, { "epoch": 0.18, "learning_rate": 1.8799408349900634e-05, "loss": 1.3682, "step": 6696 }, { "epoch": 0.18, "learning_rate": 1.8798988100897092e-05, "loss": 1.3486, "step": 6697 }, { "epoch": 0.18, "learning_rate": 1.87985677830544e-05, "loss": 1.4685, "step": 6698 }, { "epoch": 0.18, "learning_rate": 1.8798147396375855e-05, "loss": 1.3418, "step": 6699 }, { "epoch": 0.18, "learning_rate": 1.879772694086474e-05, "loss": 1.792, "step": 6700 }, { "epoch": 0.18, "learning_rate": 1.879730641652435e-05, "loss": 1.4202, "step": 6701 }, { "epoch": 0.18, "learning_rate": 1.8796885823357965e-05, "loss": 1.3645, "step": 6702 }, { "epoch": 0.18, "learning_rate": 1.8796465161368887e-05, "loss": 1.2983, "step": 6703 }, { "epoch": 0.18, "learning_rate": 1.87960444305604e-05, "loss": 1.4553, "step": 6704 }, { "epoch": 0.18, "learning_rate": 1.8795623630935797e-05, "loss": 1.4932, "step": 6705 }, { "epoch": 0.18, "learning_rate": 1.8795202762498376e-05, "loss": 1.4966, "step": 6706 }, { "epoch": 0.18, "learning_rate": 1.8794781825251417e-05, "loss": 1.3984, "step": 6707 }, { "epoch": 0.18, "learning_rate": 1.8794360819198226e-05, "loss": 1.3325, "step": 6708 }, { "epoch": 0.18, "learning_rate": 1.8793939744342088e-05, "loss": 1.4031, "step": 6709 }, { "epoch": 0.18, "learning_rate": 1.87935186006863e-05, "loss": 1.7622, "step": 6710 }, { "epoch": 0.18, "learning_rate": 1.879309738823416e-05, "loss": 1.2727, "step": 6711 }, { "epoch": 0.18, "learning_rate": 1.879267610698896e-05, "loss": 1.2883, "step": 6712 }, { "epoch": 0.18, "learning_rate": 1.8792254756954e-05, "loss": 1.3667, "step": 6713 }, { "epoch": 0.18, "learning_rate": 1.879183333813257e-05, "loss": 1.4399, "step": 6714 }, { "epoch": 0.18, "learning_rate": 1.879141185052797e-05, "loss": 1.2859, "step": 6715 }, { "epoch": 0.18, "learning_rate": 1.87909902941435e-05, "loss": 1.3071, "step": 6716 }, { "epoch": 0.18, "learning_rate": 1.8790568668982453e-05, "loss": 1.3704, "step": 6717 }, { "epoch": 0.18, "learning_rate": 1.879014697504813e-05, "loss": 1.4087, "step": 6718 }, { "epoch": 0.18, "learning_rate": 1.878972521234383e-05, "loss": 1.4231, "step": 6719 }, { "epoch": 0.18, "learning_rate": 1.8789303380872855e-05, "loss": 1.4072, "step": 6720 }, { "epoch": 0.18, "learning_rate": 1.8788881480638506e-05, "loss": 1.3032, "step": 6721 }, { "epoch": 0.18, "learning_rate": 1.8788459511644074e-05, "loss": 1.4653, "step": 6722 }, { "epoch": 0.18, "learning_rate": 1.8788037473892875e-05, "loss": 1.4194, "step": 6723 }, { "epoch": 0.18, "learning_rate": 1.87876153673882e-05, "loss": 1.2866, "step": 6724 }, { "epoch": 0.18, "learning_rate": 1.8787193192133354e-05, "loss": 1.7339, "step": 6725 }, { "epoch": 0.18, "learning_rate": 1.878677094813164e-05, "loss": 1.3999, "step": 6726 }, { "epoch": 0.18, "learning_rate": 1.878634863538636e-05, "loss": 1.3735, "step": 6727 }, { "epoch": 0.18, "learning_rate": 1.8785926253900827e-05, "loss": 1.5244, "step": 6728 }, { "epoch": 0.18, "learning_rate": 1.8785503803678335e-05, "loss": 1.4346, "step": 6729 }, { "epoch": 0.18, "learning_rate": 1.878508128472219e-05, "loss": 1.4004, "step": 6730 }, { "epoch": 0.18, "learning_rate": 1.8784658697035703e-05, "loss": 1.2864, "step": 6731 }, { "epoch": 0.18, "learning_rate": 1.8784236040622176e-05, "loss": 1.428, "step": 6732 }, { "epoch": 0.18, "learning_rate": 1.8783813315484916e-05, "loss": 1.417, "step": 6733 }, { "epoch": 0.18, "learning_rate": 1.8783390521627232e-05, "loss": 1.3572, "step": 6734 }, { "epoch": 0.18, "learning_rate": 1.8782967659052432e-05, "loss": 1.2988, "step": 6735 }, { "epoch": 0.18, "learning_rate": 1.878254472776382e-05, "loss": 1.4697, "step": 6736 }, { "epoch": 0.18, "learning_rate": 1.878212172776471e-05, "loss": 1.3271, "step": 6737 }, { "epoch": 0.18, "learning_rate": 1.8781698659058408e-05, "loss": 1.792, "step": 6738 }, { "epoch": 0.18, "learning_rate": 1.8781275521648226e-05, "loss": 1.25, "step": 6739 }, { "epoch": 0.18, "learning_rate": 1.8780852315537473e-05, "loss": 1.3386, "step": 6740 }, { "epoch": 0.18, "learning_rate": 1.878042904072946e-05, "loss": 1.3025, "step": 6741 }, { "epoch": 0.18, "learning_rate": 1.87800056972275e-05, "loss": 1.2612, "step": 6742 }, { "epoch": 0.18, "learning_rate": 1.8779582285034904e-05, "loss": 1.4246, "step": 6743 }, { "epoch": 0.18, "learning_rate": 1.8779158804154987e-05, "loss": 1.4604, "step": 6744 }, { "epoch": 0.18, "learning_rate": 1.877873525459106e-05, "loss": 1.4312, "step": 6745 }, { "epoch": 0.18, "learning_rate": 1.8778311636346434e-05, "loss": 1.3413, "step": 6746 }, { "epoch": 0.18, "learning_rate": 1.8777887949424424e-05, "loss": 1.4546, "step": 6747 }, { "epoch": 0.18, "learning_rate": 1.877746419382835e-05, "loss": 1.3306, "step": 6748 }, { "epoch": 0.18, "learning_rate": 1.877704036956152e-05, "loss": 1.4272, "step": 6749 }, { "epoch": 0.18, "learning_rate": 1.8776616476627255e-05, "loss": 1.3242, "step": 6750 }, { "epoch": 0.18, "learning_rate": 1.877619251502887e-05, "loss": 1.3247, "step": 6751 }, { "epoch": 0.18, "learning_rate": 1.877576848476968e-05, "loss": 1.29, "step": 6752 }, { "epoch": 0.18, "learning_rate": 1.8775344385853005e-05, "loss": 1.3149, "step": 6753 }, { "epoch": 0.18, "learning_rate": 1.8774920218282166e-05, "loss": 1.209, "step": 6754 }, { "epoch": 0.18, "learning_rate": 1.8774495982060473e-05, "loss": 1.4238, "step": 6755 }, { "epoch": 0.18, "learning_rate": 1.8774071677191248e-05, "loss": 1.4829, "step": 6756 }, { "epoch": 0.18, "learning_rate": 1.8773647303677816e-05, "loss": 1.5278, "step": 6757 }, { "epoch": 0.18, "learning_rate": 1.877322286152349e-05, "loss": 1.5928, "step": 6758 }, { "epoch": 0.18, "learning_rate": 1.8772798350731595e-05, "loss": 1.3823, "step": 6759 }, { "epoch": 0.18, "learning_rate": 1.8772373771305454e-05, "loss": 1.4583, "step": 6760 }, { "epoch": 0.18, "learning_rate": 1.8771949123248382e-05, "loss": 1.4534, "step": 6761 }, { "epoch": 0.18, "learning_rate": 1.8771524406563706e-05, "loss": 1.3157, "step": 6762 }, { "epoch": 0.18, "learning_rate": 1.8771099621254748e-05, "loss": 1.4912, "step": 6763 }, { "epoch": 0.18, "learning_rate": 1.877067476732483e-05, "loss": 1.3594, "step": 6764 }, { "epoch": 0.18, "learning_rate": 1.8770249844777278e-05, "loss": 1.5142, "step": 6765 }, { "epoch": 0.18, "learning_rate": 1.8769824853615413e-05, "loss": 1.4897, "step": 6766 }, { "epoch": 0.18, "learning_rate": 1.8769399793842566e-05, "loss": 1.3916, "step": 6767 }, { "epoch": 0.18, "learning_rate": 1.8768974665462055e-05, "loss": 1.2668, "step": 6768 }, { "epoch": 0.18, "learning_rate": 1.8768549468477212e-05, "loss": 1.4019, "step": 6769 }, { "epoch": 0.18, "learning_rate": 1.8768124202891364e-05, "loss": 1.3098, "step": 6770 }, { "epoch": 0.18, "learning_rate": 1.876769886870783e-05, "loss": 1.3003, "step": 6771 }, { "epoch": 0.18, "learning_rate": 1.8767273465929943e-05, "loss": 1.5076, "step": 6772 }, { "epoch": 0.18, "learning_rate": 1.876684799456103e-05, "loss": 1.4958, "step": 6773 }, { "epoch": 0.18, "learning_rate": 1.8766422454604427e-05, "loss": 1.3237, "step": 6774 }, { "epoch": 0.19, "learning_rate": 1.8765996846063456e-05, "loss": 1.4836, "step": 6775 }, { "epoch": 0.19, "learning_rate": 1.8765571168941442e-05, "loss": 1.3975, "step": 6776 }, { "epoch": 0.19, "learning_rate": 1.8765145423241727e-05, "loss": 1.2644, "step": 6777 }, { "epoch": 0.19, "learning_rate": 1.876471960896763e-05, "loss": 1.3313, "step": 6778 }, { "epoch": 0.19, "learning_rate": 1.8764293726122494e-05, "loss": 1.4434, "step": 6779 }, { "epoch": 0.19, "learning_rate": 1.8763867774709644e-05, "loss": 1.4209, "step": 6780 }, { "epoch": 0.19, "learning_rate": 1.876344175473241e-05, "loss": 1.3938, "step": 6781 }, { "epoch": 0.19, "learning_rate": 1.876301566619413e-05, "loss": 1.627, "step": 6782 }, { "epoch": 0.19, "learning_rate": 1.8762589509098137e-05, "loss": 1.2893, "step": 6783 }, { "epoch": 0.19, "learning_rate": 1.8762163283447765e-05, "loss": 1.355, "step": 6784 }, { "epoch": 0.19, "learning_rate": 1.8761736989246346e-05, "loss": 1.3086, "step": 6785 }, { "epoch": 0.19, "learning_rate": 1.876131062649722e-05, "loss": 1.3198, "step": 6786 }, { "epoch": 0.19, "learning_rate": 1.8760884195203718e-05, "loss": 1.1804, "step": 6787 }, { "epoch": 0.19, "learning_rate": 1.8760457695369174e-05, "loss": 1.2969, "step": 6788 }, { "epoch": 0.19, "learning_rate": 1.8760031126996932e-05, "loss": 1.4834, "step": 6789 }, { "epoch": 0.19, "learning_rate": 1.8759604490090322e-05, "loss": 1.4517, "step": 6790 }, { "epoch": 0.19, "learning_rate": 1.8759177784652693e-05, "loss": 1.4426, "step": 6791 }, { "epoch": 0.19, "learning_rate": 1.8758751010687367e-05, "loss": 1.3677, "step": 6792 }, { "epoch": 0.19, "learning_rate": 1.87583241681977e-05, "loss": 1.5913, "step": 6793 }, { "epoch": 0.19, "learning_rate": 1.875789725718702e-05, "loss": 1.353, "step": 6794 }, { "epoch": 0.19, "learning_rate": 1.8757470277658666e-05, "loss": 1.8057, "step": 6795 }, { "epoch": 0.19, "learning_rate": 1.8757043229615986e-05, "loss": 1.2922, "step": 6796 }, { "epoch": 0.19, "learning_rate": 1.875661611306232e-05, "loss": 1.457, "step": 6797 }, { "epoch": 0.19, "learning_rate": 1.8756188928001005e-05, "loss": 1.7598, "step": 6798 }, { "epoch": 0.19, "learning_rate": 1.8755761674435386e-05, "loss": 1.2632, "step": 6799 }, { "epoch": 0.19, "learning_rate": 1.8755334352368802e-05, "loss": 1.3064, "step": 6800 }, { "epoch": 0.19, "learning_rate": 1.8754906961804602e-05, "loss": 1.5181, "step": 6801 }, { "epoch": 0.19, "learning_rate": 1.8754479502746124e-05, "loss": 1.3726, "step": 6802 }, { "epoch": 0.19, "learning_rate": 1.8754051975196716e-05, "loss": 1.4604, "step": 6803 }, { "epoch": 0.19, "learning_rate": 1.8753624379159725e-05, "loss": 1.481, "step": 6804 }, { "epoch": 0.19, "learning_rate": 1.875319671463849e-05, "loss": 1.3843, "step": 6805 }, { "epoch": 0.19, "learning_rate": 1.875276898163636e-05, "loss": 1.4517, "step": 6806 }, { "epoch": 0.19, "learning_rate": 1.8752341180156683e-05, "loss": 1.3879, "step": 6807 }, { "epoch": 0.19, "learning_rate": 1.8751913310202803e-05, "loss": 1.3596, "step": 6808 }, { "epoch": 0.19, "learning_rate": 1.875148537177807e-05, "loss": 1.3479, "step": 6809 }, { "epoch": 0.19, "learning_rate": 1.875105736488583e-05, "loss": 1.5132, "step": 6810 }, { "epoch": 0.19, "learning_rate": 1.875062928952943e-05, "loss": 1.2419, "step": 6811 }, { "epoch": 0.19, "learning_rate": 1.8750201145712223e-05, "loss": 1.2605, "step": 6812 }, { "epoch": 0.19, "learning_rate": 1.8749772933437556e-05, "loss": 1.4014, "step": 6813 }, { "epoch": 0.19, "learning_rate": 1.8749344652708784e-05, "loss": 1.2761, "step": 6814 }, { "epoch": 0.19, "learning_rate": 1.874891630352925e-05, "loss": 1.3914, "step": 6815 }, { "epoch": 0.19, "learning_rate": 1.874848788590231e-05, "loss": 1.4131, "step": 6816 }, { "epoch": 0.19, "learning_rate": 1.8748059399831314e-05, "loss": 1.4348, "step": 6817 }, { "epoch": 0.19, "learning_rate": 1.874763084531961e-05, "loss": 1.384, "step": 6818 }, { "epoch": 0.19, "learning_rate": 1.8747202222370565e-05, "loss": 1.5076, "step": 6819 }, { "epoch": 0.19, "learning_rate": 1.874677353098752e-05, "loss": 1.4485, "step": 6820 }, { "epoch": 0.19, "learning_rate": 1.874634477117383e-05, "loss": 1.2527, "step": 6821 }, { "epoch": 0.19, "learning_rate": 1.874591594293285e-05, "loss": 1.3662, "step": 6822 }, { "epoch": 0.19, "learning_rate": 1.874548704626794e-05, "loss": 1.374, "step": 6823 }, { "epoch": 0.19, "learning_rate": 1.874505808118245e-05, "loss": 1.4119, "step": 6824 }, { "epoch": 0.19, "learning_rate": 1.8744629047679738e-05, "loss": 1.291, "step": 6825 }, { "epoch": 0.19, "learning_rate": 1.874419994576316e-05, "loss": 1.2083, "step": 6826 }, { "epoch": 0.19, "learning_rate": 1.8743770775436074e-05, "loss": 1.4568, "step": 6827 }, { "epoch": 0.19, "learning_rate": 1.8743341536701837e-05, "loss": 1.4761, "step": 6828 }, { "epoch": 0.19, "learning_rate": 1.8742912229563807e-05, "loss": 1.4336, "step": 6829 }, { "epoch": 0.19, "learning_rate": 1.8742482854025343e-05, "loss": 1.4341, "step": 6830 }, { "epoch": 0.19, "learning_rate": 1.87420534100898e-05, "loss": 1.5247, "step": 6831 }, { "epoch": 0.19, "learning_rate": 1.874162389776055e-05, "loss": 1.4304, "step": 6832 }, { "epoch": 0.19, "learning_rate": 1.8741194317040942e-05, "loss": 1.4297, "step": 6833 }, { "epoch": 0.19, "learning_rate": 1.874076466793434e-05, "loss": 1.4614, "step": 6834 }, { "epoch": 0.19, "learning_rate": 1.8740334950444104e-05, "loss": 1.4214, "step": 6835 }, { "epoch": 0.19, "learning_rate": 1.8739905164573596e-05, "loss": 1.365, "step": 6836 }, { "epoch": 0.19, "learning_rate": 1.8739475310326184e-05, "loss": 1.2175, "step": 6837 }, { "epoch": 0.19, "learning_rate": 1.8739045387705223e-05, "loss": 1.3452, "step": 6838 }, { "epoch": 0.19, "learning_rate": 1.8738615396714083e-05, "loss": 1.2246, "step": 6839 }, { "epoch": 0.19, "learning_rate": 1.873818533735612e-05, "loss": 1.3872, "step": 6840 }, { "epoch": 0.19, "learning_rate": 1.873775520963471e-05, "loss": 1.5107, "step": 6841 }, { "epoch": 0.19, "learning_rate": 1.8737325013553208e-05, "loss": 1.4678, "step": 6842 }, { "epoch": 0.19, "learning_rate": 1.873689474911499e-05, "loss": 1.4766, "step": 6843 }, { "epoch": 0.19, "learning_rate": 1.873646441632341e-05, "loss": 1.196, "step": 6844 }, { "epoch": 0.19, "learning_rate": 1.8736034015181844e-05, "loss": 1.3694, "step": 6845 }, { "epoch": 0.19, "learning_rate": 1.8735603545693653e-05, "loss": 1.4263, "step": 6846 }, { "epoch": 0.19, "learning_rate": 1.873517300786221e-05, "loss": 1.3086, "step": 6847 }, { "epoch": 0.19, "learning_rate": 1.8734742401690878e-05, "loss": 1.4048, "step": 6848 }, { "epoch": 0.19, "learning_rate": 1.873431172718303e-05, "loss": 1.4631, "step": 6849 }, { "epoch": 0.19, "learning_rate": 1.8733880984342035e-05, "loss": 1.3064, "step": 6850 }, { "epoch": 0.19, "learning_rate": 1.873345017317126e-05, "loss": 1.3896, "step": 6851 }, { "epoch": 0.19, "learning_rate": 1.8733019293674082e-05, "loss": 1.3857, "step": 6852 }, { "epoch": 0.19, "learning_rate": 1.8732588345853864e-05, "loss": 1.3252, "step": 6853 }, { "epoch": 0.19, "learning_rate": 1.8732157329713984e-05, "loss": 1.8589, "step": 6854 }, { "epoch": 0.19, "learning_rate": 1.8731726245257807e-05, "loss": 1.4163, "step": 6855 }, { "epoch": 0.19, "learning_rate": 1.873129509248871e-05, "loss": 1.3323, "step": 6856 }, { "epoch": 0.19, "learning_rate": 1.8730863871410074e-05, "loss": 1.2922, "step": 6857 }, { "epoch": 0.19, "learning_rate": 1.8730432582025256e-05, "loss": 1.3652, "step": 6858 }, { "epoch": 0.19, "learning_rate": 1.873000122433764e-05, "loss": 1.5249, "step": 6859 }, { "epoch": 0.19, "learning_rate": 1.8729569798350602e-05, "loss": 1.4419, "step": 6860 }, { "epoch": 0.19, "learning_rate": 1.8729138304067512e-05, "loss": 1.2996, "step": 6861 }, { "epoch": 0.19, "learning_rate": 1.872870674149175e-05, "loss": 1.2297, "step": 6862 }, { "epoch": 0.19, "learning_rate": 1.8728275110626694e-05, "loss": 1.4155, "step": 6863 }, { "epoch": 0.19, "learning_rate": 1.8727843411475715e-05, "loss": 1.4395, "step": 6864 }, { "epoch": 0.19, "learning_rate": 1.8727411644042192e-05, "loss": 1.4529, "step": 6865 }, { "epoch": 0.19, "learning_rate": 1.8726979808329506e-05, "loss": 1.2849, "step": 6866 }, { "epoch": 0.19, "learning_rate": 1.8726547904341034e-05, "loss": 1.3965, "step": 6867 }, { "epoch": 0.19, "learning_rate": 1.8726115932080152e-05, "loss": 1.2371, "step": 6868 }, { "epoch": 0.19, "learning_rate": 1.8725683891550247e-05, "loss": 1.4158, "step": 6869 }, { "epoch": 0.19, "learning_rate": 1.872525178275469e-05, "loss": 1.3667, "step": 6870 }, { "epoch": 0.19, "learning_rate": 1.872481960569687e-05, "loss": 1.4172, "step": 6871 }, { "epoch": 0.19, "learning_rate": 1.8724387360380163e-05, "loss": 1.4177, "step": 6872 }, { "epoch": 0.19, "learning_rate": 1.872395504680795e-05, "loss": 1.4578, "step": 6873 }, { "epoch": 0.19, "learning_rate": 1.8723522664983617e-05, "loss": 1.334, "step": 6874 }, { "epoch": 0.19, "learning_rate": 1.872309021491054e-05, "loss": 1.5198, "step": 6875 }, { "epoch": 0.19, "learning_rate": 1.8722657696592112e-05, "loss": 1.5381, "step": 6876 }, { "epoch": 0.19, "learning_rate": 1.872222511003171e-05, "loss": 1.4597, "step": 6877 }, { "epoch": 0.19, "learning_rate": 1.872179245523272e-05, "loss": 1.3921, "step": 6878 }, { "epoch": 0.19, "learning_rate": 1.872135973219853e-05, "loss": 1.2681, "step": 6879 }, { "epoch": 0.19, "learning_rate": 1.872092694093252e-05, "loss": 1.4243, "step": 6880 }, { "epoch": 0.19, "learning_rate": 1.872049408143808e-05, "loss": 1.2285, "step": 6881 }, { "epoch": 0.19, "learning_rate": 1.872006115371859e-05, "loss": 1.323, "step": 6882 }, { "epoch": 0.19, "learning_rate": 1.8719628157777447e-05, "loss": 1.4673, "step": 6883 }, { "epoch": 0.19, "learning_rate": 1.8719195093618034e-05, "loss": 1.5308, "step": 6884 }, { "epoch": 0.19, "learning_rate": 1.8718761961243737e-05, "loss": 1.4885, "step": 6885 }, { "epoch": 0.19, "learning_rate": 1.8718328760657945e-05, "loss": 1.4351, "step": 6886 }, { "epoch": 0.19, "learning_rate": 1.871789549186405e-05, "loss": 1.4519, "step": 6887 }, { "epoch": 0.19, "learning_rate": 1.8717462154865437e-05, "loss": 1.4878, "step": 6888 }, { "epoch": 0.19, "learning_rate": 1.8717028749665504e-05, "loss": 1.4836, "step": 6889 }, { "epoch": 0.19, "learning_rate": 1.8716595276267635e-05, "loss": 1.4521, "step": 6890 }, { "epoch": 0.19, "learning_rate": 1.871616173467522e-05, "loss": 1.4563, "step": 6891 }, { "epoch": 0.19, "learning_rate": 1.8715728124891658e-05, "loss": 1.4998, "step": 6892 }, { "epoch": 0.19, "learning_rate": 1.871529444692034e-05, "loss": 1.8047, "step": 6893 }, { "epoch": 0.19, "learning_rate": 1.8714860700764652e-05, "loss": 1.3464, "step": 6894 }, { "epoch": 0.19, "learning_rate": 1.8714426886427995e-05, "loss": 1.4385, "step": 6895 }, { "epoch": 0.19, "learning_rate": 1.8713993003913758e-05, "loss": 1.3298, "step": 6896 }, { "epoch": 0.19, "learning_rate": 1.871355905322534e-05, "loss": 1.5024, "step": 6897 }, { "epoch": 0.19, "learning_rate": 1.871312503436613e-05, "loss": 1.3784, "step": 6898 }, { "epoch": 0.19, "learning_rate": 1.8712690947339528e-05, "loss": 1.4561, "step": 6899 }, { "epoch": 0.19, "learning_rate": 1.871225679214893e-05, "loss": 1.3765, "step": 6900 }, { "epoch": 0.19, "learning_rate": 1.8711822568797728e-05, "loss": 1.3931, "step": 6901 }, { "epoch": 0.19, "learning_rate": 1.871138827728933e-05, "loss": 1.448, "step": 6902 }, { "epoch": 0.19, "learning_rate": 1.871095391762712e-05, "loss": 1.5278, "step": 6903 }, { "epoch": 0.19, "learning_rate": 1.8710519489814503e-05, "loss": 1.24, "step": 6904 }, { "epoch": 0.19, "learning_rate": 1.871008499385488e-05, "loss": 1.2344, "step": 6905 }, { "epoch": 0.19, "learning_rate": 1.8709650429751647e-05, "loss": 1.3633, "step": 6906 }, { "epoch": 0.19, "learning_rate": 1.8709215797508203e-05, "loss": 1.4976, "step": 6907 }, { "epoch": 0.19, "learning_rate": 1.8708781097127954e-05, "loss": 1.2769, "step": 6908 }, { "epoch": 0.19, "learning_rate": 1.8708346328614297e-05, "loss": 1.4375, "step": 6909 }, { "epoch": 0.19, "learning_rate": 1.8707911491970628e-05, "loss": 1.2937, "step": 6910 }, { "epoch": 0.19, "learning_rate": 1.8707476587200357e-05, "loss": 1.2468, "step": 6911 }, { "epoch": 0.19, "learning_rate": 1.8707041614306885e-05, "loss": 1.353, "step": 6912 }, { "epoch": 0.19, "learning_rate": 1.870660657329361e-05, "loss": 1.4875, "step": 6913 }, { "epoch": 0.19, "learning_rate": 1.8706171464163943e-05, "loss": 1.3442, "step": 6914 }, { "epoch": 0.19, "learning_rate": 1.8705736286921282e-05, "loss": 1.4167, "step": 6915 }, { "epoch": 0.19, "learning_rate": 1.8705301041569038e-05, "loss": 1.3528, "step": 6916 }, { "epoch": 0.19, "learning_rate": 1.8704865728110608e-05, "loss": 1.4233, "step": 6917 }, { "epoch": 0.19, "learning_rate": 1.8704430346549404e-05, "loss": 1.428, "step": 6918 }, { "epoch": 0.19, "learning_rate": 1.8703994896888828e-05, "loss": 1.3909, "step": 6919 }, { "epoch": 0.19, "learning_rate": 1.870355937913229e-05, "loss": 1.3455, "step": 6920 }, { "epoch": 0.19, "learning_rate": 1.8703123793283198e-05, "loss": 1.429, "step": 6921 }, { "epoch": 0.19, "learning_rate": 1.8702688139344953e-05, "loss": 1.3293, "step": 6922 }, { "epoch": 0.19, "learning_rate": 1.870225241732097e-05, "loss": 1.4209, "step": 6923 }, { "epoch": 0.19, "learning_rate": 1.870181662721466e-05, "loss": 1.1968, "step": 6924 }, { "epoch": 0.19, "learning_rate": 1.8701380769029428e-05, "loss": 1.3772, "step": 6925 }, { "epoch": 0.19, "learning_rate": 1.870094484276868e-05, "loss": 1.313, "step": 6926 }, { "epoch": 0.19, "learning_rate": 1.8700508848435834e-05, "loss": 1.3457, "step": 6927 }, { "epoch": 0.19, "learning_rate": 1.87000727860343e-05, "loss": 1.3879, "step": 6928 }, { "epoch": 0.19, "learning_rate": 1.8699636655567483e-05, "loss": 1.4077, "step": 6929 }, { "epoch": 0.19, "learning_rate": 1.8699200457038804e-05, "loss": 1.5063, "step": 6930 }, { "epoch": 0.19, "learning_rate": 1.8698764190451668e-05, "loss": 1.4763, "step": 6931 }, { "epoch": 0.19, "learning_rate": 1.8698327855809493e-05, "loss": 1.4758, "step": 6932 }, { "epoch": 0.19, "learning_rate": 1.8697891453115692e-05, "loss": 1.4968, "step": 6933 }, { "epoch": 0.19, "learning_rate": 1.8697454982373677e-05, "loss": 1.3447, "step": 6934 }, { "epoch": 0.19, "learning_rate": 1.869701844358686e-05, "loss": 1.4216, "step": 6935 }, { "epoch": 0.19, "learning_rate": 1.869658183675867e-05, "loss": 1.2998, "step": 6936 }, { "epoch": 0.19, "learning_rate": 1.8696145161892508e-05, "loss": 1.5125, "step": 6937 }, { "epoch": 0.19, "learning_rate": 1.8695708418991793e-05, "loss": 1.2603, "step": 6938 }, { "epoch": 0.19, "learning_rate": 1.8695271608059946e-05, "loss": 1.3164, "step": 6939 }, { "epoch": 0.19, "learning_rate": 1.8694834729100386e-05, "loss": 1.1948, "step": 6940 }, { "epoch": 0.19, "learning_rate": 1.8694397782116525e-05, "loss": 1.4678, "step": 6941 }, { "epoch": 0.19, "learning_rate": 1.8693960767111782e-05, "loss": 1.4062, "step": 6942 }, { "epoch": 0.19, "learning_rate": 1.869352368408958e-05, "loss": 1.2593, "step": 6943 }, { "epoch": 0.19, "learning_rate": 1.869308653305334e-05, "loss": 1.4614, "step": 6944 }, { "epoch": 0.19, "learning_rate": 1.8692649314006473e-05, "loss": 1.3472, "step": 6945 }, { "epoch": 0.19, "learning_rate": 1.869221202695241e-05, "loss": 1.5249, "step": 6946 }, { "epoch": 0.19, "learning_rate": 1.8691774671894562e-05, "loss": 1.4619, "step": 6947 }, { "epoch": 0.19, "learning_rate": 1.8691337248836362e-05, "loss": 1.4678, "step": 6948 }, { "epoch": 0.19, "learning_rate": 1.8690899757781223e-05, "loss": 1.292, "step": 6949 }, { "epoch": 0.19, "learning_rate": 1.8690462198732574e-05, "loss": 1.4849, "step": 6950 }, { "epoch": 0.19, "learning_rate": 1.869002457169383e-05, "loss": 1.3003, "step": 6951 }, { "epoch": 0.19, "learning_rate": 1.8689586876668424e-05, "loss": 1.1655, "step": 6952 }, { "epoch": 0.19, "learning_rate": 1.8689149113659778e-05, "loss": 1.4292, "step": 6953 }, { "epoch": 0.19, "learning_rate": 1.8688711282671313e-05, "loss": 1.4067, "step": 6954 }, { "epoch": 0.19, "learning_rate": 1.8688273383706455e-05, "loss": 1.5093, "step": 6955 }, { "epoch": 0.19, "learning_rate": 1.8687835416768633e-05, "loss": 1.4736, "step": 6956 }, { "epoch": 0.19, "learning_rate": 1.8687397381861272e-05, "loss": 1.3384, "step": 6957 }, { "epoch": 0.19, "learning_rate": 1.86869592789878e-05, "loss": 1.366, "step": 6958 }, { "epoch": 0.19, "learning_rate": 1.8686521108151642e-05, "loss": 1.2622, "step": 6959 }, { "epoch": 0.19, "learning_rate": 1.8686082869356227e-05, "loss": 1.4736, "step": 6960 }, { "epoch": 0.19, "learning_rate": 1.8685644562604986e-05, "loss": 1.3208, "step": 6961 }, { "epoch": 0.19, "learning_rate": 1.8685206187901345e-05, "loss": 1.4263, "step": 6962 }, { "epoch": 0.19, "learning_rate": 1.8684767745248736e-05, "loss": 1.3853, "step": 6963 }, { "epoch": 0.19, "learning_rate": 1.868432923465059e-05, "loss": 1.3621, "step": 6964 }, { "epoch": 0.19, "learning_rate": 1.8683890656110334e-05, "loss": 1.437, "step": 6965 }, { "epoch": 0.19, "learning_rate": 1.86834520096314e-05, "loss": 1.3291, "step": 6966 }, { "epoch": 0.19, "learning_rate": 1.868301329521722e-05, "loss": 1.4636, "step": 6967 }, { "epoch": 0.19, "learning_rate": 1.8682574512871225e-05, "loss": 1.4211, "step": 6968 }, { "epoch": 0.19, "learning_rate": 1.8682135662596854e-05, "loss": 1.2461, "step": 6969 }, { "epoch": 0.19, "learning_rate": 1.8681696744397535e-05, "loss": 1.0378, "step": 6970 }, { "epoch": 0.19, "learning_rate": 1.8681257758276704e-05, "loss": 1.4702, "step": 6971 }, { "epoch": 0.19, "learning_rate": 1.868081870423779e-05, "loss": 1.3872, "step": 6972 }, { "epoch": 0.19, "learning_rate": 1.868037958228424e-05, "loss": 1.4019, "step": 6973 }, { "epoch": 0.19, "learning_rate": 1.8679940392419475e-05, "loss": 1.2639, "step": 6974 }, { "epoch": 0.19, "learning_rate": 1.867950113464694e-05, "loss": 1.2761, "step": 6975 }, { "epoch": 0.19, "learning_rate": 1.8679061808970074e-05, "loss": 1.4453, "step": 6976 }, { "epoch": 0.19, "learning_rate": 1.8678622415392304e-05, "loss": 1.3691, "step": 6977 }, { "epoch": 0.19, "learning_rate": 1.8678182953917078e-05, "loss": 1.2764, "step": 6978 }, { "epoch": 0.19, "learning_rate": 1.8677743424547824e-05, "loss": 1.3979, "step": 6979 }, { "epoch": 0.19, "learning_rate": 1.867730382728799e-05, "loss": 1.4536, "step": 6980 }, { "epoch": 0.19, "learning_rate": 1.867686416214101e-05, "loss": 1.3337, "step": 6981 }, { "epoch": 0.19, "learning_rate": 1.8676424429110325e-05, "loss": 1.375, "step": 6982 }, { "epoch": 0.19, "learning_rate": 1.867598462819937e-05, "loss": 1.3662, "step": 6983 }, { "epoch": 0.19, "learning_rate": 1.86755447594116e-05, "loss": 1.4668, "step": 6984 }, { "epoch": 0.19, "learning_rate": 1.867510482275044e-05, "loss": 1.4373, "step": 6985 }, { "epoch": 0.19, "learning_rate": 1.8674664818219344e-05, "loss": 1.4893, "step": 6986 }, { "epoch": 0.19, "learning_rate": 1.867422474582175e-05, "loss": 1.3831, "step": 6987 }, { "epoch": 0.19, "learning_rate": 1.86737846055611e-05, "loss": 1.3889, "step": 6988 }, { "epoch": 0.19, "learning_rate": 1.8673344397440832e-05, "loss": 1.3247, "step": 6989 }, { "epoch": 0.19, "learning_rate": 1.8672904121464402e-05, "loss": 1.4766, "step": 6990 }, { "epoch": 0.19, "learning_rate": 1.8672463777635246e-05, "loss": 1.4744, "step": 6991 }, { "epoch": 0.19, "learning_rate": 1.8672023365956814e-05, "loss": 1.4128, "step": 6992 }, { "epoch": 0.19, "learning_rate": 1.8671582886432546e-05, "loss": 1.5459, "step": 6993 }, { "epoch": 0.19, "learning_rate": 1.8671142339065893e-05, "loss": 1.4497, "step": 6994 }, { "epoch": 0.19, "learning_rate": 1.86707017238603e-05, "loss": 1.342, "step": 6995 }, { "epoch": 0.19, "learning_rate": 1.8670261040819212e-05, "loss": 1.3403, "step": 6996 }, { "epoch": 0.19, "learning_rate": 1.866982028994608e-05, "loss": 1.3499, "step": 6997 }, { "epoch": 0.19, "learning_rate": 1.866937947124435e-05, "loss": 1.3713, "step": 6998 }, { "epoch": 0.19, "learning_rate": 1.8668938584717473e-05, "loss": 1.4236, "step": 6999 }, { "epoch": 0.19, "learning_rate": 1.8668497630368897e-05, "loss": 1.4482, "step": 7000 }, { "epoch": 0.19, "learning_rate": 1.866805660820207e-05, "loss": 1.5093, "step": 7001 }, { "epoch": 0.19, "learning_rate": 1.8667615518220444e-05, "loss": 1.4575, "step": 7002 }, { "epoch": 0.19, "learning_rate": 1.8667174360427473e-05, "loss": 1.355, "step": 7003 }, { "epoch": 0.19, "learning_rate": 1.8666733134826604e-05, "loss": 1.2983, "step": 7004 }, { "epoch": 0.19, "learning_rate": 1.866629184142129e-05, "loss": 1.4795, "step": 7005 }, { "epoch": 0.19, "learning_rate": 1.8665850480214986e-05, "loss": 1.397, "step": 7006 }, { "epoch": 0.19, "learning_rate": 1.8665409051211138e-05, "loss": 1.4243, "step": 7007 }, { "epoch": 0.19, "learning_rate": 1.866496755441321e-05, "loss": 1.4185, "step": 7008 }, { "epoch": 0.19, "learning_rate": 1.8664525989824646e-05, "loss": 1.4353, "step": 7009 }, { "epoch": 0.19, "learning_rate": 1.8664084357448903e-05, "loss": 1.2744, "step": 7010 }, { "epoch": 0.19, "learning_rate": 1.8663642657289443e-05, "loss": 1.4414, "step": 7011 }, { "epoch": 0.19, "learning_rate": 1.8663200889349715e-05, "loss": 1.2344, "step": 7012 }, { "epoch": 0.19, "learning_rate": 1.8662759053633176e-05, "loss": 1.47, "step": 7013 }, { "epoch": 0.19, "learning_rate": 1.8662317150143287e-05, "loss": 1.439, "step": 7014 }, { "epoch": 0.19, "learning_rate": 1.86618751788835e-05, "loss": 1.4932, "step": 7015 }, { "epoch": 0.19, "learning_rate": 1.8661433139857273e-05, "loss": 1.3486, "step": 7016 }, { "epoch": 0.19, "learning_rate": 1.866099103306807e-05, "loss": 1.3765, "step": 7017 }, { "epoch": 0.19, "learning_rate": 1.8660548858519344e-05, "loss": 1.3491, "step": 7018 }, { "epoch": 0.19, "learning_rate": 1.8660106616214552e-05, "loss": 1.3525, "step": 7019 }, { "epoch": 0.19, "learning_rate": 1.8659664306157164e-05, "loss": 1.4109, "step": 7020 }, { "epoch": 0.19, "learning_rate": 1.865922192835063e-05, "loss": 1.23, "step": 7021 }, { "epoch": 0.19, "learning_rate": 1.865877948279842e-05, "loss": 1.468, "step": 7022 }, { "epoch": 0.19, "learning_rate": 1.8658336969503987e-05, "loss": 1.3301, "step": 7023 }, { "epoch": 0.19, "learning_rate": 1.86578943884708e-05, "loss": 1.449, "step": 7024 }, { "epoch": 0.19, "learning_rate": 1.8657451739702317e-05, "loss": 1.3765, "step": 7025 }, { "epoch": 0.19, "learning_rate": 1.8657009023202003e-05, "loss": 1.2832, "step": 7026 }, { "epoch": 0.19, "learning_rate": 1.865656623897332e-05, "loss": 1.488, "step": 7027 }, { "epoch": 0.19, "learning_rate": 1.8656123387019737e-05, "loss": 1.4404, "step": 7028 }, { "epoch": 0.19, "learning_rate": 1.8655680467344713e-05, "loss": 1.4619, "step": 7029 }, { "epoch": 0.19, "learning_rate": 1.8655237479951712e-05, "loss": 1.4314, "step": 7030 }, { "epoch": 0.19, "learning_rate": 1.8654794424844204e-05, "loss": 1.3252, "step": 7031 }, { "epoch": 0.19, "learning_rate": 1.865435130202566e-05, "loss": 1.509, "step": 7032 }, { "epoch": 0.19, "learning_rate": 1.8653908111499534e-05, "loss": 1.3069, "step": 7033 }, { "epoch": 0.19, "learning_rate": 1.8653464853269304e-05, "loss": 1.7881, "step": 7034 }, { "epoch": 0.19, "learning_rate": 1.8653021527338434e-05, "loss": 1.4478, "step": 7035 }, { "epoch": 0.19, "learning_rate": 1.865257813371039e-05, "loss": 1.5, "step": 7036 }, { "epoch": 0.19, "learning_rate": 1.8652134672388645e-05, "loss": 1.2322, "step": 7037 }, { "epoch": 0.19, "learning_rate": 1.8651691143376666e-05, "loss": 1.4292, "step": 7038 }, { "epoch": 0.19, "learning_rate": 1.8651247546677928e-05, "loss": 1.6929, "step": 7039 }, { "epoch": 0.19, "learning_rate": 1.865080388229589e-05, "loss": 1.4326, "step": 7040 }, { "epoch": 0.19, "learning_rate": 1.8650360150234033e-05, "loss": 1.3633, "step": 7041 }, { "epoch": 0.19, "learning_rate": 1.8649916350495833e-05, "loss": 1.4109, "step": 7042 }, { "epoch": 0.19, "learning_rate": 1.864947248308475e-05, "loss": 1.3718, "step": 7043 }, { "epoch": 0.19, "learning_rate": 1.8649028548004256e-05, "loss": 1.356, "step": 7044 }, { "epoch": 0.19, "learning_rate": 1.8648584545257835e-05, "loss": 1.6121, "step": 7045 }, { "epoch": 0.19, "learning_rate": 1.8648140474848955e-05, "loss": 1.2898, "step": 7046 }, { "epoch": 0.19, "learning_rate": 1.8647696336781093e-05, "loss": 1.2754, "step": 7047 }, { "epoch": 0.19, "learning_rate": 1.8647252131057717e-05, "loss": 1.4209, "step": 7048 }, { "epoch": 0.19, "learning_rate": 1.8646807857682308e-05, "loss": 1.2839, "step": 7049 }, { "epoch": 0.19, "learning_rate": 1.8646363516658338e-05, "loss": 1.2656, "step": 7050 }, { "epoch": 0.19, "learning_rate": 1.864591910798929e-05, "loss": 1.2239, "step": 7051 }, { "epoch": 0.19, "learning_rate": 1.8645474631678634e-05, "loss": 1.4268, "step": 7052 }, { "epoch": 0.19, "learning_rate": 1.8645030087729852e-05, "loss": 1.4648, "step": 7053 }, { "epoch": 0.19, "learning_rate": 1.864458547614642e-05, "loss": 1.3809, "step": 7054 }, { "epoch": 0.19, "learning_rate": 1.8644140796931812e-05, "loss": 1.4163, "step": 7055 }, { "epoch": 0.19, "learning_rate": 1.8643696050089515e-05, "loss": 1.2849, "step": 7056 }, { "epoch": 0.19, "learning_rate": 1.8643251235623e-05, "loss": 1.4368, "step": 7057 }, { "epoch": 0.19, "learning_rate": 1.8642806353535757e-05, "loss": 1.3555, "step": 7058 }, { "epoch": 0.19, "learning_rate": 1.8642361403831258e-05, "loss": 1.4167, "step": 7059 }, { "epoch": 0.19, "learning_rate": 1.864191638651299e-05, "loss": 1.4348, "step": 7060 }, { "epoch": 0.19, "learning_rate": 1.864147130158443e-05, "loss": 1.4426, "step": 7061 }, { "epoch": 0.19, "learning_rate": 1.864102614904906e-05, "loss": 1.4131, "step": 7062 }, { "epoch": 0.19, "learning_rate": 1.8640580928910368e-05, "loss": 1.4011, "step": 7063 }, { "epoch": 0.19, "learning_rate": 1.8640135641171836e-05, "loss": 1.427, "step": 7064 }, { "epoch": 0.19, "learning_rate": 1.8639690285836943e-05, "loss": 1.3994, "step": 7065 }, { "epoch": 0.19, "learning_rate": 1.8639244862909173e-05, "loss": 1.4209, "step": 7066 }, { "epoch": 0.19, "learning_rate": 1.8638799372392017e-05, "loss": 1.4778, "step": 7067 }, { "epoch": 0.19, "learning_rate": 1.8638353814288956e-05, "loss": 1.4287, "step": 7068 }, { "epoch": 0.19, "learning_rate": 1.8637908188603475e-05, "loss": 1.4509, "step": 7069 }, { "epoch": 0.19, "learning_rate": 1.8637462495339065e-05, "loss": 1.2839, "step": 7070 }, { "epoch": 0.19, "learning_rate": 1.863701673449921e-05, "loss": 1.321, "step": 7071 }, { "epoch": 0.19, "learning_rate": 1.8636570906087398e-05, "loss": 1.4614, "step": 7072 }, { "epoch": 0.19, "learning_rate": 1.8636125010107113e-05, "loss": 1.4753, "step": 7073 }, { "epoch": 0.19, "learning_rate": 1.863567904656185e-05, "loss": 1.3398, "step": 7074 }, { "epoch": 0.19, "learning_rate": 1.8635233015455093e-05, "loss": 1.3706, "step": 7075 }, { "epoch": 0.19, "learning_rate": 1.8634786916790334e-05, "loss": 1.2869, "step": 7076 }, { "epoch": 0.19, "learning_rate": 1.863434075057106e-05, "loss": 1.3191, "step": 7077 }, { "epoch": 0.19, "learning_rate": 1.8633894516800773e-05, "loss": 1.3716, "step": 7078 }, { "epoch": 0.19, "learning_rate": 1.8633448215482947e-05, "loss": 1.2236, "step": 7079 }, { "epoch": 0.19, "learning_rate": 1.8633001846621085e-05, "loss": 1.3396, "step": 7080 }, { "epoch": 0.19, "learning_rate": 1.8632555410218675e-05, "loss": 1.2773, "step": 7081 }, { "epoch": 0.19, "learning_rate": 1.8632108906279208e-05, "loss": 1.5093, "step": 7082 }, { "epoch": 0.19, "learning_rate": 1.8631662334806187e-05, "loss": 1.3477, "step": 7083 }, { "epoch": 0.19, "learning_rate": 1.8631215695803092e-05, "loss": 1.4907, "step": 7084 }, { "epoch": 0.19, "learning_rate": 1.863076898927343e-05, "loss": 1.4883, "step": 7085 }, { "epoch": 0.19, "learning_rate": 1.8630322215220684e-05, "loss": 1.1285, "step": 7086 }, { "epoch": 0.19, "learning_rate": 1.862987537364836e-05, "loss": 1.2847, "step": 7087 }, { "epoch": 0.19, "learning_rate": 1.8629428464559948e-05, "loss": 1.2649, "step": 7088 }, { "epoch": 0.19, "learning_rate": 1.8628981487958942e-05, "loss": 1.3674, "step": 7089 }, { "epoch": 0.19, "learning_rate": 1.8628534443848848e-05, "loss": 1.262, "step": 7090 }, { "epoch": 0.19, "learning_rate": 1.8628087332233152e-05, "loss": 1.6562, "step": 7091 }, { "epoch": 0.19, "learning_rate": 1.862764015311536e-05, "loss": 1.5239, "step": 7092 }, { "epoch": 0.19, "learning_rate": 1.862719290649897e-05, "loss": 1.4104, "step": 7093 }, { "epoch": 0.19, "learning_rate": 1.862674559238748e-05, "loss": 1.481, "step": 7094 }, { "epoch": 0.19, "learning_rate": 1.862629821078439e-05, "loss": 1.1443, "step": 7095 }, { "epoch": 0.19, "learning_rate": 1.8625850761693196e-05, "loss": 1.4302, "step": 7096 }, { "epoch": 0.19, "learning_rate": 1.8625403245117404e-05, "loss": 1.4568, "step": 7097 }, { "epoch": 0.19, "learning_rate": 1.862495566106051e-05, "loss": 1.4846, "step": 7098 }, { "epoch": 0.19, "learning_rate": 1.862450800952602e-05, "loss": 1.3719, "step": 7099 }, { "epoch": 0.19, "learning_rate": 1.8624060290517438e-05, "loss": 1.5015, "step": 7100 }, { "epoch": 0.19, "learning_rate": 1.8623612504038263e-05, "loss": 1.4468, "step": 7101 }, { "epoch": 0.19, "learning_rate": 1.8623164650091996e-05, "loss": 1.5227, "step": 7102 }, { "epoch": 0.19, "learning_rate": 1.8622716728682144e-05, "loss": 1.4197, "step": 7103 }, { "epoch": 0.19, "learning_rate": 1.8622268739812212e-05, "loss": 1.5488, "step": 7104 }, { "epoch": 0.19, "learning_rate": 1.86218206834857e-05, "loss": 1.375, "step": 7105 }, { "epoch": 0.19, "learning_rate": 1.8621372559706125e-05, "loss": 1.3464, "step": 7106 }, { "epoch": 0.19, "learning_rate": 1.862092436847698e-05, "loss": 1.4648, "step": 7107 }, { "epoch": 0.19, "learning_rate": 1.862047610980178e-05, "loss": 1.3882, "step": 7108 }, { "epoch": 0.19, "learning_rate": 1.8620027783684022e-05, "loss": 1.2581, "step": 7109 }, { "epoch": 0.19, "learning_rate": 1.8619579390127224e-05, "loss": 1.334, "step": 7110 }, { "epoch": 0.19, "learning_rate": 1.861913092913489e-05, "loss": 1.2825, "step": 7111 }, { "epoch": 0.19, "learning_rate": 1.8618682400710527e-05, "loss": 1.3213, "step": 7112 }, { "epoch": 0.19, "learning_rate": 1.861823380485765e-05, "loss": 1.3984, "step": 7113 }, { "epoch": 0.19, "learning_rate": 1.861778514157976e-05, "loss": 1.3213, "step": 7114 }, { "epoch": 0.19, "learning_rate": 1.8617336410880376e-05, "loss": 1.6946, "step": 7115 }, { "epoch": 0.19, "learning_rate": 1.8616887612763e-05, "loss": 1.5093, "step": 7116 }, { "epoch": 0.19, "learning_rate": 1.861643874723115e-05, "loss": 1.3948, "step": 7117 }, { "epoch": 0.19, "learning_rate": 1.8615989814288333e-05, "loss": 1.5098, "step": 7118 }, { "epoch": 0.19, "learning_rate": 1.8615540813938063e-05, "loss": 1.3816, "step": 7119 }, { "epoch": 0.19, "learning_rate": 1.8615091746183852e-05, "loss": 1.5391, "step": 7120 }, { "epoch": 0.19, "learning_rate": 1.8614642611029217e-05, "loss": 1.5056, "step": 7121 }, { "epoch": 0.19, "learning_rate": 1.8614193408477668e-05, "loss": 1.3936, "step": 7122 }, { "epoch": 0.19, "learning_rate": 1.8613744138532718e-05, "loss": 1.3921, "step": 7123 }, { "epoch": 0.19, "learning_rate": 1.861329480119789e-05, "loss": 1.2354, "step": 7124 }, { "epoch": 0.19, "learning_rate": 1.8612845396476687e-05, "loss": 1.4297, "step": 7125 }, { "epoch": 0.19, "learning_rate": 1.8612395924372637e-05, "loss": 1.3782, "step": 7126 }, { "epoch": 0.19, "learning_rate": 1.8611946384889253e-05, "loss": 1.4883, "step": 7127 }, { "epoch": 0.19, "learning_rate": 1.8611496778030044e-05, "loss": 1.4404, "step": 7128 }, { "epoch": 0.19, "learning_rate": 1.8611047103798535e-05, "loss": 1.1389, "step": 7129 }, { "epoch": 0.19, "learning_rate": 1.8610597362198244e-05, "loss": 1.4067, "step": 7130 }, { "epoch": 0.19, "learning_rate": 1.861014755323269e-05, "loss": 1.4277, "step": 7131 }, { "epoch": 0.19, "learning_rate": 1.8609697676905388e-05, "loss": 1.4436, "step": 7132 }, { "epoch": 0.19, "learning_rate": 1.860924773321986e-05, "loss": 1.3105, "step": 7133 }, { "epoch": 0.19, "learning_rate": 1.8608797722179626e-05, "loss": 1.4038, "step": 7134 }, { "epoch": 0.19, "learning_rate": 1.8608347643788206e-05, "loss": 1.3384, "step": 7135 }, { "epoch": 0.19, "learning_rate": 1.8607897498049122e-05, "loss": 1.4722, "step": 7136 }, { "epoch": 0.19, "learning_rate": 1.8607447284965898e-05, "loss": 1.2141, "step": 7137 }, { "epoch": 0.19, "learning_rate": 1.8606997004542053e-05, "loss": 1.4165, "step": 7138 }, { "epoch": 0.19, "learning_rate": 1.860654665678111e-05, "loss": 1.3953, "step": 7139 }, { "epoch": 0.19, "learning_rate": 1.8606096241686595e-05, "loss": 1.293, "step": 7140 }, { "epoch": 0.2, "learning_rate": 1.8605645759262028e-05, "loss": 1.2749, "step": 7141 }, { "epoch": 0.2, "learning_rate": 1.8605195209510935e-05, "loss": 1.2847, "step": 7142 }, { "epoch": 0.2, "learning_rate": 1.860474459243684e-05, "loss": 1.4209, "step": 7143 }, { "epoch": 0.2, "learning_rate": 1.8604293908043272e-05, "loss": 1.4434, "step": 7144 }, { "epoch": 0.2, "learning_rate": 1.8603843156333755e-05, "loss": 1.5029, "step": 7145 }, { "epoch": 0.2, "learning_rate": 1.8603392337311813e-05, "loss": 1.4233, "step": 7146 }, { "epoch": 0.2, "learning_rate": 1.8602941450980975e-05, "loss": 1.3198, "step": 7147 }, { "epoch": 0.2, "learning_rate": 1.860249049734477e-05, "loss": 1.3469, "step": 7148 }, { "epoch": 0.2, "learning_rate": 1.8602039476406724e-05, "loss": 1.4841, "step": 7149 }, { "epoch": 0.2, "learning_rate": 1.8601588388170367e-05, "loss": 1.3477, "step": 7150 }, { "epoch": 0.2, "learning_rate": 1.8601137232639224e-05, "loss": 1.3186, "step": 7151 }, { "epoch": 0.2, "learning_rate": 1.860068600981683e-05, "loss": 1.3293, "step": 7152 }, { "epoch": 0.2, "learning_rate": 1.8600234719706712e-05, "loss": 1.3516, "step": 7153 }, { "epoch": 0.2, "learning_rate": 1.85997833623124e-05, "loss": 1.2881, "step": 7154 }, { "epoch": 0.2, "learning_rate": 1.8599331937637434e-05, "loss": 1.4199, "step": 7155 }, { "epoch": 0.2, "learning_rate": 1.8598880445685333e-05, "loss": 1.3735, "step": 7156 }, { "epoch": 0.2, "learning_rate": 1.8598428886459635e-05, "loss": 1.4119, "step": 7157 }, { "epoch": 0.2, "learning_rate": 1.8597977259963872e-05, "loss": 1.2805, "step": 7158 }, { "epoch": 0.2, "learning_rate": 1.859752556620158e-05, "loss": 1.5952, "step": 7159 }, { "epoch": 0.2, "learning_rate": 1.859707380517629e-05, "loss": 1.292, "step": 7160 }, { "epoch": 0.2, "learning_rate": 1.859662197689154e-05, "loss": 1.3025, "step": 7161 }, { "epoch": 0.2, "learning_rate": 1.8596170081350858e-05, "loss": 1.4265, "step": 7162 }, { "epoch": 0.2, "learning_rate": 1.8595718118557783e-05, "loss": 1.4551, "step": 7163 }, { "epoch": 0.2, "learning_rate": 1.8595266088515856e-05, "loss": 1.3999, "step": 7164 }, { "epoch": 0.2, "learning_rate": 1.8594813991228603e-05, "loss": 1.335, "step": 7165 }, { "epoch": 0.2, "learning_rate": 1.8594361826699572e-05, "loss": 1.2957, "step": 7166 }, { "epoch": 0.2, "learning_rate": 1.8593909594932293e-05, "loss": 1.4941, "step": 7167 }, { "epoch": 0.2, "learning_rate": 1.859345729593031e-05, "loss": 1.8687, "step": 7168 }, { "epoch": 0.2, "learning_rate": 1.8593004929697153e-05, "loss": 1.4028, "step": 7169 }, { "epoch": 0.2, "learning_rate": 1.8592552496236367e-05, "loss": 1.3745, "step": 7170 }, { "epoch": 0.2, "learning_rate": 1.8592099995551492e-05, "loss": 1.334, "step": 7171 }, { "epoch": 0.2, "learning_rate": 1.8591647427646066e-05, "loss": 1.2437, "step": 7172 }, { "epoch": 0.2, "learning_rate": 1.8591194792523635e-05, "loss": 1.3767, "step": 7173 }, { "epoch": 0.2, "learning_rate": 1.859074209018773e-05, "loss": 1.3757, "step": 7174 }, { "epoch": 0.2, "learning_rate": 1.8590289320641904e-05, "loss": 1.4224, "step": 7175 }, { "epoch": 0.2, "learning_rate": 1.8589836483889687e-05, "loss": 1.4805, "step": 7176 }, { "epoch": 0.2, "learning_rate": 1.858938357993463e-05, "loss": 1.3652, "step": 7177 }, { "epoch": 0.2, "learning_rate": 1.8588930608780282e-05, "loss": 1.4351, "step": 7178 }, { "epoch": 0.2, "learning_rate": 1.858847757043017e-05, "loss": 1.353, "step": 7179 }, { "epoch": 0.2, "learning_rate": 1.8588024464887854e-05, "loss": 1.3335, "step": 7180 }, { "epoch": 0.2, "learning_rate": 1.8587571292156875e-05, "loss": 1.4106, "step": 7181 }, { "epoch": 0.2, "learning_rate": 1.8587118052240773e-05, "loss": 1.312, "step": 7182 }, { "epoch": 0.2, "learning_rate": 1.8586664745143098e-05, "loss": 1.2664, "step": 7183 }, { "epoch": 0.2, "learning_rate": 1.8586211370867394e-05, "loss": 1.4751, "step": 7184 }, { "epoch": 0.2, "learning_rate": 1.858575792941721e-05, "loss": 1.7446, "step": 7185 }, { "epoch": 0.2, "learning_rate": 1.8585304420796096e-05, "loss": 1.3901, "step": 7186 }, { "epoch": 0.2, "learning_rate": 1.8584850845007595e-05, "loss": 1.4236, "step": 7187 }, { "epoch": 0.2, "learning_rate": 1.858439720205526e-05, "loss": 1.3088, "step": 7188 }, { "epoch": 0.2, "learning_rate": 1.8583943491942635e-05, "loss": 1.5723, "step": 7189 }, { "epoch": 0.2, "learning_rate": 1.8583489714673274e-05, "loss": 1.3936, "step": 7190 }, { "epoch": 0.2, "learning_rate": 1.8583035870250724e-05, "loss": 1.1633, "step": 7191 }, { "epoch": 0.2, "learning_rate": 1.8582581958678543e-05, "loss": 1.3718, "step": 7192 }, { "epoch": 0.2, "learning_rate": 1.858212797996027e-05, "loss": 1.186, "step": 7193 }, { "epoch": 0.2, "learning_rate": 1.8581673934099465e-05, "loss": 1.7471, "step": 7194 }, { "epoch": 0.2, "learning_rate": 1.8581219821099685e-05, "loss": 1.3901, "step": 7195 }, { "epoch": 0.2, "learning_rate": 1.8580765640964466e-05, "loss": 1.437, "step": 7196 }, { "epoch": 0.2, "learning_rate": 1.8580311393697376e-05, "loss": 1.4551, "step": 7197 }, { "epoch": 0.2, "learning_rate": 1.8579857079301966e-05, "loss": 1.3105, "step": 7198 }, { "epoch": 0.2, "learning_rate": 1.8579402697781787e-05, "loss": 1.271, "step": 7199 }, { "epoch": 0.2, "learning_rate": 1.8578948249140397e-05, "loss": 1.3425, "step": 7200 }, { "epoch": 0.2, "learning_rate": 1.8578493733381352e-05, "loss": 1.3538, "step": 7201 }, { "epoch": 0.2, "learning_rate": 1.85780391505082e-05, "loss": 1.3801, "step": 7202 }, { "epoch": 0.2, "learning_rate": 1.8577584500524507e-05, "loss": 1.2383, "step": 7203 }, { "epoch": 0.2, "learning_rate": 1.857712978343383e-05, "loss": 1.2273, "step": 7204 }, { "epoch": 0.2, "learning_rate": 1.8576674999239713e-05, "loss": 1.3809, "step": 7205 }, { "epoch": 0.2, "learning_rate": 1.857622014794573e-05, "loss": 1.4817, "step": 7206 }, { "epoch": 0.2, "learning_rate": 1.8575765229555433e-05, "loss": 1.3989, "step": 7207 }, { "epoch": 0.2, "learning_rate": 1.8575310244072383e-05, "loss": 1.3704, "step": 7208 }, { "epoch": 0.2, "learning_rate": 1.8574855191500134e-05, "loss": 1.4165, "step": 7209 }, { "epoch": 0.2, "learning_rate": 1.8574400071842254e-05, "loss": 1.4741, "step": 7210 }, { "epoch": 0.2, "learning_rate": 1.85739448851023e-05, "loss": 1.5154, "step": 7211 }, { "epoch": 0.2, "learning_rate": 1.857348963128383e-05, "loss": 1.4043, "step": 7212 }, { "epoch": 0.2, "learning_rate": 1.857303431039041e-05, "loss": 1.4309, "step": 7213 }, { "epoch": 0.2, "learning_rate": 1.85725789224256e-05, "loss": 1.22, "step": 7214 }, { "epoch": 0.2, "learning_rate": 1.8572123467392964e-05, "loss": 1.2585, "step": 7215 }, { "epoch": 0.2, "learning_rate": 1.8571667945296067e-05, "loss": 1.3152, "step": 7216 }, { "epoch": 0.2, "learning_rate": 1.8571212356138468e-05, "loss": 1.4448, "step": 7217 }, { "epoch": 0.2, "learning_rate": 1.8570756699923733e-05, "loss": 1.7852, "step": 7218 }, { "epoch": 0.2, "learning_rate": 1.8570300976655433e-05, "loss": 1.2722, "step": 7219 }, { "epoch": 0.2, "learning_rate": 1.8569845186337124e-05, "loss": 1.4502, "step": 7220 }, { "epoch": 0.2, "learning_rate": 1.856938932897238e-05, "loss": 1.4097, "step": 7221 }, { "epoch": 0.2, "learning_rate": 1.8568933404564757e-05, "loss": 1.4006, "step": 7222 }, { "epoch": 0.2, "learning_rate": 1.8568477413117834e-05, "loss": 1.4341, "step": 7223 }, { "epoch": 0.2, "learning_rate": 1.856802135463517e-05, "loss": 1.3459, "step": 7224 }, { "epoch": 0.2, "learning_rate": 1.8567565229120338e-05, "loss": 1.4558, "step": 7225 }, { "epoch": 0.2, "learning_rate": 1.8567109036576904e-05, "loss": 1.3093, "step": 7226 }, { "epoch": 0.2, "learning_rate": 1.8566652777008434e-05, "loss": 1.4487, "step": 7227 }, { "epoch": 0.2, "learning_rate": 1.8566196450418502e-05, "loss": 1.3403, "step": 7228 }, { "epoch": 0.2, "learning_rate": 1.856574005681068e-05, "loss": 1.4517, "step": 7229 }, { "epoch": 0.2, "learning_rate": 1.8565283596188534e-05, "loss": 1.4788, "step": 7230 }, { "epoch": 0.2, "learning_rate": 1.8564827068555638e-05, "loss": 1.4319, "step": 7231 }, { "epoch": 0.2, "learning_rate": 1.8564370473915563e-05, "loss": 1.4031, "step": 7232 }, { "epoch": 0.2, "learning_rate": 1.8563913812271876e-05, "loss": 1.3867, "step": 7233 }, { "epoch": 0.2, "learning_rate": 1.856345708362816e-05, "loss": 1.4771, "step": 7234 }, { "epoch": 0.2, "learning_rate": 1.856300028798798e-05, "loss": 1.3638, "step": 7235 }, { "epoch": 0.2, "learning_rate": 1.8562543425354913e-05, "loss": 1.4414, "step": 7236 }, { "epoch": 0.2, "learning_rate": 1.8562086495732532e-05, "loss": 1.3503, "step": 7237 }, { "epoch": 0.2, "learning_rate": 1.856162949912441e-05, "loss": 1.4292, "step": 7238 }, { "epoch": 0.2, "learning_rate": 1.856117243553413e-05, "loss": 1.4634, "step": 7239 }, { "epoch": 0.2, "learning_rate": 1.856071530496526e-05, "loss": 1.2944, "step": 7240 }, { "epoch": 0.2, "learning_rate": 1.856025810742138e-05, "loss": 1.4492, "step": 7241 }, { "epoch": 0.2, "learning_rate": 1.8559800842906065e-05, "loss": 1.2822, "step": 7242 }, { "epoch": 0.2, "learning_rate": 1.8559343511422893e-05, "loss": 1.3135, "step": 7243 }, { "epoch": 0.2, "learning_rate": 1.8558886112975446e-05, "loss": 1.374, "step": 7244 }, { "epoch": 0.2, "learning_rate": 1.855842864756729e-05, "loss": 1.4011, "step": 7245 }, { "epoch": 0.2, "learning_rate": 1.8557971115202022e-05, "loss": 1.3347, "step": 7246 }, { "epoch": 0.2, "learning_rate": 1.8557513515883206e-05, "loss": 1.5596, "step": 7247 }, { "epoch": 0.2, "learning_rate": 1.8557055849614432e-05, "loss": 1.457, "step": 7248 }, { "epoch": 0.2, "learning_rate": 1.8556598116399277e-05, "loss": 1.4202, "step": 7249 }, { "epoch": 0.2, "learning_rate": 1.855614031624132e-05, "loss": 1.3752, "step": 7250 }, { "epoch": 0.2, "learning_rate": 1.8555682449144143e-05, "loss": 1.4551, "step": 7251 }, { "epoch": 0.2, "learning_rate": 1.855522451511133e-05, "loss": 1.5059, "step": 7252 }, { "epoch": 0.2, "learning_rate": 1.8554766514146466e-05, "loss": 1.4114, "step": 7253 }, { "epoch": 0.2, "learning_rate": 1.855430844625313e-05, "loss": 1.4973, "step": 7254 }, { "epoch": 0.2, "learning_rate": 1.8553850311434908e-05, "loss": 1.3574, "step": 7255 }, { "epoch": 0.2, "learning_rate": 1.8553392109695384e-05, "loss": 1.666, "step": 7256 }, { "epoch": 0.2, "learning_rate": 1.855293384103814e-05, "loss": 1.396, "step": 7257 }, { "epoch": 0.2, "learning_rate": 1.8552475505466766e-05, "loss": 1.4663, "step": 7258 }, { "epoch": 0.2, "learning_rate": 1.8552017102984842e-05, "loss": 1.3452, "step": 7259 }, { "epoch": 0.2, "learning_rate": 1.8551558633595964e-05, "loss": 1.5156, "step": 7260 }, { "epoch": 0.2, "learning_rate": 1.8551100097303705e-05, "loss": 1.2156, "step": 7261 }, { "epoch": 0.2, "learning_rate": 1.8550641494111663e-05, "loss": 1.4653, "step": 7262 }, { "epoch": 0.2, "learning_rate": 1.8550182824023424e-05, "loss": 1.5073, "step": 7263 }, { "epoch": 0.2, "learning_rate": 1.8549724087042575e-05, "loss": 1.3794, "step": 7264 }, { "epoch": 0.2, "learning_rate": 1.8549265283172702e-05, "loss": 1.2676, "step": 7265 }, { "epoch": 0.2, "learning_rate": 1.85488064124174e-05, "loss": 1.4004, "step": 7266 }, { "epoch": 0.2, "learning_rate": 1.8548347474780258e-05, "loss": 1.4995, "step": 7267 }, { "epoch": 0.2, "learning_rate": 1.8547888470264862e-05, "loss": 1.3774, "step": 7268 }, { "epoch": 0.2, "learning_rate": 1.854742939887481e-05, "loss": 1.1785, "step": 7269 }, { "epoch": 0.2, "learning_rate": 1.8546970260613683e-05, "loss": 1.3152, "step": 7270 }, { "epoch": 0.2, "learning_rate": 1.8546511055485082e-05, "loss": 1.4102, "step": 7271 }, { "epoch": 0.2, "learning_rate": 1.8546051783492602e-05, "loss": 1.2944, "step": 7272 }, { "epoch": 0.2, "learning_rate": 1.8545592444639828e-05, "loss": 1.3132, "step": 7273 }, { "epoch": 0.2, "learning_rate": 1.854513303893036e-05, "loss": 1.2227, "step": 7274 }, { "epoch": 0.2, "learning_rate": 1.8544673566367786e-05, "loss": 1.428, "step": 7275 }, { "epoch": 0.2, "learning_rate": 1.8544214026955705e-05, "loss": 1.3621, "step": 7276 }, { "epoch": 0.2, "learning_rate": 1.854375442069771e-05, "loss": 1.4387, "step": 7277 }, { "epoch": 0.2, "learning_rate": 1.85432947475974e-05, "loss": 1.3219, "step": 7278 }, { "epoch": 0.2, "learning_rate": 1.8542835007658368e-05, "loss": 1.3215, "step": 7279 }, { "epoch": 0.2, "learning_rate": 1.8542375200884213e-05, "loss": 1.3167, "step": 7280 }, { "epoch": 0.2, "learning_rate": 1.8541915327278532e-05, "loss": 1.436, "step": 7281 }, { "epoch": 0.2, "learning_rate": 1.8541455386844923e-05, "loss": 1.3816, "step": 7282 }, { "epoch": 0.2, "learning_rate": 1.854099537958698e-05, "loss": 1.3684, "step": 7283 }, { "epoch": 0.2, "learning_rate": 1.8540535305508306e-05, "loss": 1.335, "step": 7284 }, { "epoch": 0.2, "learning_rate": 1.8540075164612502e-05, "loss": 1.3865, "step": 7285 }, { "epoch": 0.2, "learning_rate": 1.8539614956903166e-05, "loss": 1.501, "step": 7286 }, { "epoch": 0.2, "learning_rate": 1.8539154682383892e-05, "loss": 1.356, "step": 7287 }, { "epoch": 0.2, "learning_rate": 1.8538694341058293e-05, "loss": 1.3152, "step": 7288 }, { "epoch": 0.2, "learning_rate": 1.8538233932929964e-05, "loss": 1.3438, "step": 7289 }, { "epoch": 0.2, "learning_rate": 1.853777345800251e-05, "loss": 1.4419, "step": 7290 }, { "epoch": 0.2, "learning_rate": 1.8537312916279526e-05, "loss": 1.4104, "step": 7291 }, { "epoch": 0.2, "learning_rate": 1.8536852307764625e-05, "loss": 1.3936, "step": 7292 }, { "epoch": 0.2, "learning_rate": 1.8536391632461402e-05, "loss": 1.3916, "step": 7293 }, { "epoch": 0.2, "learning_rate": 1.8535930890373467e-05, "loss": 1.375, "step": 7294 }, { "epoch": 0.2, "learning_rate": 1.853547008150442e-05, "loss": 1.5874, "step": 7295 }, { "epoch": 0.2, "learning_rate": 1.8535009205857872e-05, "loss": 1.4907, "step": 7296 }, { "epoch": 0.2, "learning_rate": 1.8534548263437426e-05, "loss": 1.47, "step": 7297 }, { "epoch": 0.2, "learning_rate": 1.8534087254246684e-05, "loss": 1.4299, "step": 7298 }, { "epoch": 0.2, "learning_rate": 1.853362617828926e-05, "loss": 1.2639, "step": 7299 }, { "epoch": 0.2, "learning_rate": 1.8533165035568755e-05, "loss": 1.4502, "step": 7300 }, { "epoch": 0.2, "learning_rate": 1.8532703826088778e-05, "loss": 1.4326, "step": 7301 }, { "epoch": 0.2, "learning_rate": 1.8532242549852942e-05, "loss": 1.4641, "step": 7302 }, { "epoch": 0.2, "learning_rate": 1.8531781206864852e-05, "loss": 1.3792, "step": 7303 }, { "epoch": 0.2, "learning_rate": 1.853131979712812e-05, "loss": 1.3689, "step": 7304 }, { "epoch": 0.2, "learning_rate": 1.853085832064635e-05, "loss": 1.5098, "step": 7305 }, { "epoch": 0.2, "learning_rate": 1.8530396777423153e-05, "loss": 1.4644, "step": 7306 }, { "epoch": 0.2, "learning_rate": 1.8529935167462147e-05, "loss": 1.47, "step": 7307 }, { "epoch": 0.2, "learning_rate": 1.8529473490766938e-05, "loss": 1.4707, "step": 7308 }, { "epoch": 0.2, "learning_rate": 1.8529011747341142e-05, "loss": 1.4478, "step": 7309 }, { "epoch": 0.2, "learning_rate": 1.8528549937188364e-05, "loss": 1.5024, "step": 7310 }, { "epoch": 0.2, "learning_rate": 1.8528088060312226e-05, "loss": 1.4658, "step": 7311 }, { "epoch": 0.2, "learning_rate": 1.8527626116716335e-05, "loss": 1.3696, "step": 7312 }, { "epoch": 0.2, "learning_rate": 1.852716410640431e-05, "loss": 1.3774, "step": 7313 }, { "epoch": 0.2, "learning_rate": 1.8526702029379757e-05, "loss": 1.2434, "step": 7314 }, { "epoch": 0.2, "learning_rate": 1.8526239885646302e-05, "loss": 1.3859, "step": 7315 }, { "epoch": 0.2, "learning_rate": 1.8525777675207552e-05, "loss": 1.4565, "step": 7316 }, { "epoch": 0.2, "learning_rate": 1.8525315398067133e-05, "loss": 1.4148, "step": 7317 }, { "epoch": 0.2, "learning_rate": 1.852485305422865e-05, "loss": 1.3945, "step": 7318 }, { "epoch": 0.2, "learning_rate": 1.8524390643695723e-05, "loss": 1.4243, "step": 7319 }, { "epoch": 0.2, "learning_rate": 1.8523928166471977e-05, "loss": 1.8223, "step": 7320 }, { "epoch": 0.2, "learning_rate": 1.8523465622561024e-05, "loss": 1.3101, "step": 7321 }, { "epoch": 0.2, "learning_rate": 1.8523003011966482e-05, "loss": 1.3201, "step": 7322 }, { "epoch": 0.2, "learning_rate": 1.8522540334691974e-05, "loss": 1.3999, "step": 7323 }, { "epoch": 0.2, "learning_rate": 1.8522077590741117e-05, "loss": 1.4873, "step": 7324 }, { "epoch": 0.2, "learning_rate": 1.852161478011753e-05, "loss": 1.2192, "step": 7325 }, { "epoch": 0.2, "learning_rate": 1.852115190282484e-05, "loss": 1.4082, "step": 7326 }, { "epoch": 0.2, "learning_rate": 1.8520688958866668e-05, "loss": 1.3511, "step": 7327 }, { "epoch": 0.2, "learning_rate": 1.8520225948246623e-05, "loss": 1.3569, "step": 7328 }, { "epoch": 0.2, "learning_rate": 1.8519762870968344e-05, "loss": 1.1533, "step": 7329 }, { "epoch": 0.2, "learning_rate": 1.8519299727035444e-05, "loss": 1.5, "step": 7330 }, { "epoch": 0.2, "learning_rate": 1.8518836516451548e-05, "loss": 1.4033, "step": 7331 }, { "epoch": 0.2, "learning_rate": 1.8518373239220283e-05, "loss": 1.4648, "step": 7332 }, { "epoch": 0.2, "learning_rate": 1.851790989534527e-05, "loss": 1.3833, "step": 7333 }, { "epoch": 0.2, "learning_rate": 1.851744648483014e-05, "loss": 1.271, "step": 7334 }, { "epoch": 0.2, "learning_rate": 1.8516983007678505e-05, "loss": 1.446, "step": 7335 }, { "epoch": 0.2, "learning_rate": 1.8516519463894006e-05, "loss": 1.3528, "step": 7336 }, { "epoch": 0.2, "learning_rate": 1.851605585348026e-05, "loss": 1.5327, "step": 7337 }, { "epoch": 0.2, "learning_rate": 1.85155921764409e-05, "loss": 1.2517, "step": 7338 }, { "epoch": 0.2, "learning_rate": 1.8515128432779553e-05, "loss": 1.4653, "step": 7339 }, { "epoch": 0.2, "learning_rate": 1.851466462249984e-05, "loss": 1.2444, "step": 7340 }, { "epoch": 0.2, "learning_rate": 1.8514200745605397e-05, "loss": 1.4351, "step": 7341 }, { "epoch": 0.2, "learning_rate": 1.8513736802099852e-05, "loss": 1.3865, "step": 7342 }, { "epoch": 0.2, "learning_rate": 1.8513272791986835e-05, "loss": 1.2639, "step": 7343 }, { "epoch": 0.2, "learning_rate": 1.8512808715269974e-05, "loss": 1.4077, "step": 7344 }, { "epoch": 0.2, "learning_rate": 1.85123445719529e-05, "loss": 1.4612, "step": 7345 }, { "epoch": 0.2, "learning_rate": 1.8511880362039246e-05, "loss": 1.311, "step": 7346 }, { "epoch": 0.2, "learning_rate": 1.8511416085532642e-05, "loss": 1.4536, "step": 7347 }, { "epoch": 0.2, "learning_rate": 1.8510951742436717e-05, "loss": 1.386, "step": 7348 }, { "epoch": 0.2, "learning_rate": 1.851048733275511e-05, "loss": 1.3984, "step": 7349 }, { "epoch": 0.2, "learning_rate": 1.8510022856491457e-05, "loss": 1.5093, "step": 7350 }, { "epoch": 0.2, "learning_rate": 1.8509558313649383e-05, "loss": 1.4021, "step": 7351 }, { "epoch": 0.2, "learning_rate": 1.8509093704232523e-05, "loss": 1.4985, "step": 7352 }, { "epoch": 0.2, "learning_rate": 1.850862902824452e-05, "loss": 1.2566, "step": 7353 }, { "epoch": 0.2, "learning_rate": 1.8508164285689002e-05, "loss": 1.4321, "step": 7354 }, { "epoch": 0.2, "learning_rate": 1.8507699476569606e-05, "loss": 1.4155, "step": 7355 }, { "epoch": 0.2, "learning_rate": 1.8507234600889975e-05, "loss": 1.9126, "step": 7356 }, { "epoch": 0.2, "learning_rate": 1.8506769658653737e-05, "loss": 1.3928, "step": 7357 }, { "epoch": 0.2, "learning_rate": 1.8506304649864535e-05, "loss": 1.2396, "step": 7358 }, { "epoch": 0.2, "learning_rate": 1.8505839574526004e-05, "loss": 1.3733, "step": 7359 }, { "epoch": 0.2, "learning_rate": 1.8505374432641786e-05, "loss": 1.4253, "step": 7360 }, { "epoch": 0.2, "learning_rate": 1.8504909224215514e-05, "loss": 1.4153, "step": 7361 }, { "epoch": 0.2, "learning_rate": 1.8504443949250833e-05, "loss": 1.3962, "step": 7362 }, { "epoch": 0.2, "learning_rate": 1.8503978607751385e-05, "loss": 1.4609, "step": 7363 }, { "epoch": 0.2, "learning_rate": 1.8503513199720803e-05, "loss": 1.4036, "step": 7364 }, { "epoch": 0.2, "learning_rate": 1.850304772516274e-05, "loss": 1.4629, "step": 7365 }, { "epoch": 0.2, "learning_rate": 1.850258218408082e-05, "loss": 1.4224, "step": 7366 }, { "epoch": 0.2, "learning_rate": 1.85021165764787e-05, "loss": 1.2878, "step": 7367 }, { "epoch": 0.2, "learning_rate": 1.8501650902360017e-05, "loss": 1.2793, "step": 7368 }, { "epoch": 0.2, "learning_rate": 1.8501185161728416e-05, "loss": 1.2234, "step": 7369 }, { "epoch": 0.2, "learning_rate": 1.850071935458754e-05, "loss": 1.4727, "step": 7370 }, { "epoch": 0.2, "learning_rate": 1.850025348094103e-05, "loss": 1.2893, "step": 7371 }, { "epoch": 0.2, "learning_rate": 1.849978754079254e-05, "loss": 1.3877, "step": 7372 }, { "epoch": 0.2, "learning_rate": 1.8499321534145704e-05, "loss": 1.3882, "step": 7373 }, { "epoch": 0.2, "learning_rate": 1.8498855461004173e-05, "loss": 1.293, "step": 7374 }, { "epoch": 0.2, "learning_rate": 1.8498389321371597e-05, "loss": 1.458, "step": 7375 }, { "epoch": 0.2, "learning_rate": 1.8497923115251617e-05, "loss": 1.3716, "step": 7376 }, { "epoch": 0.2, "learning_rate": 1.849745684264788e-05, "loss": 1.4333, "step": 7377 }, { "epoch": 0.2, "learning_rate": 1.849699050356404e-05, "loss": 1.3792, "step": 7378 }, { "epoch": 0.2, "learning_rate": 1.8496524098003742e-05, "loss": 1.4043, "step": 7379 }, { "epoch": 0.2, "learning_rate": 1.8496057625970633e-05, "loss": 1.3857, "step": 7380 }, { "epoch": 0.2, "learning_rate": 1.8495591087468364e-05, "loss": 1.4565, "step": 7381 }, { "epoch": 0.2, "learning_rate": 1.8495124482500586e-05, "loss": 1.4387, "step": 7382 }, { "epoch": 0.2, "learning_rate": 1.8494657811070947e-05, "loss": 1.2933, "step": 7383 }, { "epoch": 0.2, "learning_rate": 1.8494191073183103e-05, "loss": 1.4299, "step": 7384 }, { "epoch": 0.2, "learning_rate": 1.84937242688407e-05, "loss": 1.2695, "step": 7385 }, { "epoch": 0.2, "learning_rate": 1.8493257398047393e-05, "loss": 1.5142, "step": 7386 }, { "epoch": 0.2, "learning_rate": 1.8492790460806834e-05, "loss": 1.4204, "step": 7387 }, { "epoch": 0.2, "learning_rate": 1.8492323457122677e-05, "loss": 1.3933, "step": 7388 }, { "epoch": 0.2, "learning_rate": 1.8491856386998574e-05, "loss": 1.4409, "step": 7389 }, { "epoch": 0.2, "learning_rate": 1.849138925043818e-05, "loss": 1.4011, "step": 7390 }, { "epoch": 0.2, "learning_rate": 1.849092204744515e-05, "loss": 1.3601, "step": 7391 }, { "epoch": 0.2, "learning_rate": 1.8490454778023136e-05, "loss": 1.3535, "step": 7392 }, { "epoch": 0.2, "learning_rate": 1.8489987442175798e-05, "loss": 1.4258, "step": 7393 }, { "epoch": 0.2, "learning_rate": 1.8489520039906793e-05, "loss": 1.1863, "step": 7394 }, { "epoch": 0.2, "learning_rate": 1.848905257121977e-05, "loss": 1.5103, "step": 7395 }, { "epoch": 0.2, "learning_rate": 1.8488585036118393e-05, "loss": 1.8276, "step": 7396 }, { "epoch": 0.2, "learning_rate": 1.848811743460632e-05, "loss": 1.4204, "step": 7397 }, { "epoch": 0.2, "learning_rate": 1.8487649766687206e-05, "loss": 1.4634, "step": 7398 }, { "epoch": 0.2, "learning_rate": 1.8487182032364714e-05, "loss": 1.3757, "step": 7399 }, { "epoch": 0.2, "learning_rate": 1.84867142316425e-05, "loss": 1.3325, "step": 7400 }, { "epoch": 0.2, "learning_rate": 1.8486246364524225e-05, "loss": 1.292, "step": 7401 }, { "epoch": 0.2, "learning_rate": 1.8485778431013547e-05, "loss": 1.5039, "step": 7402 }, { "epoch": 0.2, "learning_rate": 1.848531043111413e-05, "loss": 1.4229, "step": 7403 }, { "epoch": 0.2, "learning_rate": 1.8484842364829634e-05, "loss": 1.2827, "step": 7404 }, { "epoch": 0.2, "learning_rate": 1.848437423216372e-05, "loss": 1.4717, "step": 7405 }, { "epoch": 0.2, "learning_rate": 1.8483906033120053e-05, "loss": 1.3032, "step": 7406 }, { "epoch": 0.2, "learning_rate": 1.8483437767702296e-05, "loss": 1.4081, "step": 7407 }, { "epoch": 0.2, "learning_rate": 1.848296943591411e-05, "loss": 1.4121, "step": 7408 }, { "epoch": 0.2, "learning_rate": 1.8482501037759157e-05, "loss": 1.4436, "step": 7409 }, { "epoch": 0.2, "learning_rate": 1.848203257324111e-05, "loss": 1.3701, "step": 7410 }, { "epoch": 0.2, "learning_rate": 1.8481564042363622e-05, "loss": 1.5347, "step": 7411 }, { "epoch": 0.2, "learning_rate": 1.848109544513037e-05, "loss": 1.4424, "step": 7412 }, { "epoch": 0.2, "learning_rate": 1.8480626781545013e-05, "loss": 1.46, "step": 7413 }, { "epoch": 0.2, "learning_rate": 1.8480158051611223e-05, "loss": 1.3992, "step": 7414 }, { "epoch": 0.2, "learning_rate": 1.8479689255332666e-05, "loss": 1.3284, "step": 7415 }, { "epoch": 0.2, "learning_rate": 1.8479220392713e-05, "loss": 1.2754, "step": 7416 }, { "epoch": 0.2, "learning_rate": 1.8478751463755905e-05, "loss": 1.4783, "step": 7417 }, { "epoch": 0.2, "learning_rate": 1.8478282468465046e-05, "loss": 1.4292, "step": 7418 }, { "epoch": 0.2, "learning_rate": 1.847781340684409e-05, "loss": 1.5522, "step": 7419 }, { "epoch": 0.2, "learning_rate": 1.8477344278896708e-05, "loss": 1.2664, "step": 7420 }, { "epoch": 0.2, "learning_rate": 1.8476875084626575e-05, "loss": 1.4478, "step": 7421 }, { "epoch": 0.2, "learning_rate": 1.8476405824037356e-05, "loss": 1.363, "step": 7422 }, { "epoch": 0.2, "learning_rate": 1.847593649713272e-05, "loss": 1.2568, "step": 7423 }, { "epoch": 0.2, "learning_rate": 1.8475467103916346e-05, "loss": 1.4575, "step": 7424 }, { "epoch": 0.2, "learning_rate": 1.8474997644391902e-05, "loss": 1.3206, "step": 7425 }, { "epoch": 0.2, "learning_rate": 1.847452811856306e-05, "loss": 1.2366, "step": 7426 }, { "epoch": 0.2, "learning_rate": 1.84740585264335e-05, "loss": 1.4248, "step": 7427 }, { "epoch": 0.2, "learning_rate": 1.8473588868006885e-05, "loss": 1.4634, "step": 7428 }, { "epoch": 0.2, "learning_rate": 1.84731191432869e-05, "loss": 1.4697, "step": 7429 }, { "epoch": 0.2, "learning_rate": 1.8472649352277212e-05, "loss": 1.2678, "step": 7430 }, { "epoch": 0.2, "learning_rate": 1.84721794949815e-05, "loss": 1.4263, "step": 7431 }, { "epoch": 0.2, "learning_rate": 1.847170957140344e-05, "loss": 1.2637, "step": 7432 }, { "epoch": 0.2, "learning_rate": 1.8471239581546706e-05, "loss": 1.5298, "step": 7433 }, { "epoch": 0.2, "learning_rate": 1.847076952541498e-05, "loss": 1.3501, "step": 7434 }, { "epoch": 0.2, "learning_rate": 1.8470299403011936e-05, "loss": 1.4253, "step": 7435 }, { "epoch": 0.2, "learning_rate": 1.8469829214341254e-05, "loss": 1.6216, "step": 7436 }, { "epoch": 0.2, "learning_rate": 1.8469358959406608e-05, "loss": 1.3682, "step": 7437 }, { "epoch": 0.2, "learning_rate": 1.8468888638211678e-05, "loss": 1.2156, "step": 7438 }, { "epoch": 0.2, "learning_rate": 1.846841825076015e-05, "loss": 1.2034, "step": 7439 }, { "epoch": 0.2, "learning_rate": 1.8467947797055698e-05, "loss": 1.4409, "step": 7440 }, { "epoch": 0.2, "learning_rate": 1.8467477277102003e-05, "loss": 1.3662, "step": 7441 }, { "epoch": 0.2, "learning_rate": 1.846700669090275e-05, "loss": 1.3809, "step": 7442 }, { "epoch": 0.2, "learning_rate": 1.846653603846162e-05, "loss": 1.4995, "step": 7443 }, { "epoch": 0.2, "learning_rate": 1.846606531978229e-05, "loss": 1.332, "step": 7444 }, { "epoch": 0.2, "learning_rate": 1.8465594534868447e-05, "loss": 1.5466, "step": 7445 }, { "epoch": 0.2, "learning_rate": 1.8465123683723772e-05, "loss": 1.4277, "step": 7446 }, { "epoch": 0.2, "learning_rate": 1.8464652766351953e-05, "loss": 1.5383, "step": 7447 }, { "epoch": 0.2, "learning_rate": 1.846418178275667e-05, "loss": 1.415, "step": 7448 }, { "epoch": 0.2, "learning_rate": 1.8463710732941602e-05, "loss": 1.4937, "step": 7449 }, { "epoch": 0.2, "learning_rate": 1.8463239616910446e-05, "loss": 1.7144, "step": 7450 }, { "epoch": 0.2, "learning_rate": 1.8462768434666888e-05, "loss": 1.3923, "step": 7451 }, { "epoch": 0.2, "learning_rate": 1.8462297186214603e-05, "loss": 1.1768, "step": 7452 }, { "epoch": 0.2, "learning_rate": 1.8461825871557284e-05, "loss": 1.4475, "step": 7453 }, { "epoch": 0.2, "learning_rate": 1.846135449069862e-05, "loss": 1.4482, "step": 7454 }, { "epoch": 0.2, "learning_rate": 1.84608830436423e-05, "loss": 1.3313, "step": 7455 }, { "epoch": 0.2, "learning_rate": 1.8460411530392005e-05, "loss": 1.4275, "step": 7456 }, { "epoch": 0.2, "learning_rate": 1.8459939950951434e-05, "loss": 1.7573, "step": 7457 }, { "epoch": 0.2, "learning_rate": 1.8459468305324265e-05, "loss": 1.4741, "step": 7458 }, { "epoch": 0.2, "learning_rate": 1.8458996593514197e-05, "loss": 1.3235, "step": 7459 }, { "epoch": 0.2, "learning_rate": 1.8458524815524916e-05, "loss": 1.3687, "step": 7460 }, { "epoch": 0.2, "learning_rate": 1.845805297136012e-05, "loss": 1.4385, "step": 7461 }, { "epoch": 0.2, "learning_rate": 1.8457581061023488e-05, "loss": 1.5293, "step": 7462 }, { "epoch": 0.2, "learning_rate": 1.845710908451872e-05, "loss": 1.4956, "step": 7463 }, { "epoch": 0.2, "learning_rate": 1.845663704184951e-05, "loss": 1.3667, "step": 7464 }, { "epoch": 0.2, "learning_rate": 1.8456164933019544e-05, "loss": 1.3459, "step": 7465 }, { "epoch": 0.2, "learning_rate": 1.8455692758032524e-05, "loss": 1.356, "step": 7466 }, { "epoch": 0.2, "learning_rate": 1.845522051689214e-05, "loss": 1.3245, "step": 7467 }, { "epoch": 0.2, "learning_rate": 1.8454748209602083e-05, "loss": 1.4463, "step": 7468 }, { "epoch": 0.2, "learning_rate": 1.8454275836166052e-05, "loss": 1.2507, "step": 7469 }, { "epoch": 0.2, "learning_rate": 1.8453803396587745e-05, "loss": 1.7632, "step": 7470 }, { "epoch": 0.2, "learning_rate": 1.8453330890870857e-05, "loss": 1.4238, "step": 7471 }, { "epoch": 0.2, "learning_rate": 1.845285831901908e-05, "loss": 1.2739, "step": 7472 }, { "epoch": 0.2, "learning_rate": 1.8452385681036115e-05, "loss": 1.2407, "step": 7473 }, { "epoch": 0.2, "learning_rate": 1.845191297692566e-05, "loss": 1.4202, "step": 7474 }, { "epoch": 0.2, "learning_rate": 1.845144020669141e-05, "loss": 1.3594, "step": 7475 }, { "epoch": 0.2, "learning_rate": 1.845096737033707e-05, "loss": 1.4048, "step": 7476 }, { "epoch": 0.2, "learning_rate": 1.8450494467866332e-05, "loss": 1.4082, "step": 7477 }, { "epoch": 0.2, "learning_rate": 1.84500214992829e-05, "loss": 1.3408, "step": 7478 }, { "epoch": 0.2, "learning_rate": 1.844954846459047e-05, "loss": 1.3477, "step": 7479 }, { "epoch": 0.2, "learning_rate": 1.844907536379275e-05, "loss": 1.3318, "step": 7480 }, { "epoch": 0.2, "learning_rate": 1.8448602196893436e-05, "loss": 1.3635, "step": 7481 }, { "epoch": 0.2, "learning_rate": 1.8448128963896233e-05, "loss": 1.2749, "step": 7482 }, { "epoch": 0.2, "learning_rate": 1.844765566480484e-05, "loss": 1.3455, "step": 7483 }, { "epoch": 0.2, "learning_rate": 1.8447182299622963e-05, "loss": 1.2808, "step": 7484 }, { "epoch": 0.2, "learning_rate": 1.84467088683543e-05, "loss": 1.458, "step": 7485 }, { "epoch": 0.2, "learning_rate": 1.8446235371002564e-05, "loss": 1.4355, "step": 7486 }, { "epoch": 0.2, "learning_rate": 1.844576180757145e-05, "loss": 1.4546, "step": 7487 }, { "epoch": 0.2, "learning_rate": 1.8445288178064667e-05, "loss": 1.3616, "step": 7488 }, { "epoch": 0.2, "learning_rate": 1.8444814482485923e-05, "loss": 1.2126, "step": 7489 }, { "epoch": 0.2, "learning_rate": 1.844434072083892e-05, "loss": 1.5234, "step": 7490 }, { "epoch": 0.2, "learning_rate": 1.8443866893127367e-05, "loss": 1.8511, "step": 7491 }, { "epoch": 0.2, "learning_rate": 1.844339299935497e-05, "loss": 1.5034, "step": 7492 }, { "epoch": 0.2, "learning_rate": 1.8442919039525435e-05, "loss": 1.5142, "step": 7493 }, { "epoch": 0.2, "learning_rate": 1.8442445013642473e-05, "loss": 1.4011, "step": 7494 }, { "epoch": 0.2, "learning_rate": 1.844197092170979e-05, "loss": 1.4226, "step": 7495 }, { "epoch": 0.2, "learning_rate": 1.8441496763731098e-05, "loss": 1.4443, "step": 7496 }, { "epoch": 0.2, "learning_rate": 1.8441022539710104e-05, "loss": 1.418, "step": 7497 }, { "epoch": 0.2, "learning_rate": 1.844054824965052e-05, "loss": 1.3042, "step": 7498 }, { "epoch": 0.2, "learning_rate": 1.844007389355605e-05, "loss": 1.3772, "step": 7499 }, { "epoch": 0.2, "learning_rate": 1.843959947143042e-05, "loss": 1.5171, "step": 7500 }, { "epoch": 0.2, "learning_rate": 1.8439124983277326e-05, "loss": 1.2605, "step": 7501 }, { "epoch": 0.2, "learning_rate": 1.8438650429100488e-05, "loss": 1.3213, "step": 7502 }, { "epoch": 0.2, "learning_rate": 1.8438175808903614e-05, "loss": 1.4275, "step": 7503 }, { "epoch": 0.2, "learning_rate": 1.8437701122690423e-05, "loss": 1.3484, "step": 7504 }, { "epoch": 0.2, "learning_rate": 1.843722637046463e-05, "loss": 1.3376, "step": 7505 }, { "epoch": 0.2, "learning_rate": 1.843675155222994e-05, "loss": 1.7585, "step": 7506 }, { "epoch": 0.21, "learning_rate": 1.8436276667990073e-05, "loss": 1.385, "step": 7507 }, { "epoch": 0.21, "learning_rate": 1.8435801717748747e-05, "loss": 1.4299, "step": 7508 }, { "epoch": 0.21, "learning_rate": 1.8435326701509675e-05, "loss": 1.7642, "step": 7509 }, { "epoch": 0.21, "learning_rate": 1.843485161927657e-05, "loss": 1.3667, "step": 7510 }, { "epoch": 0.21, "learning_rate": 1.8434376471053157e-05, "loss": 1.4001, "step": 7511 }, { "epoch": 0.21, "learning_rate": 1.8433901256843147e-05, "loss": 1.3381, "step": 7512 }, { "epoch": 0.21, "learning_rate": 1.843342597665026e-05, "loss": 1.406, "step": 7513 }, { "epoch": 0.21, "learning_rate": 1.843295063047821e-05, "loss": 1.3701, "step": 7514 }, { "epoch": 0.21, "learning_rate": 1.8432475218330723e-05, "loss": 1.4495, "step": 7515 }, { "epoch": 0.21, "learning_rate": 1.8431999740211518e-05, "loss": 1.3689, "step": 7516 }, { "epoch": 0.21, "learning_rate": 1.8431524196124306e-05, "loss": 1.3284, "step": 7517 }, { "epoch": 0.21, "learning_rate": 1.8431048586072818e-05, "loss": 1.28, "step": 7518 }, { "epoch": 0.21, "learning_rate": 1.8430572910060767e-05, "loss": 1.4272, "step": 7519 }, { "epoch": 0.21, "learning_rate": 1.843009716809188e-05, "loss": 1.479, "step": 7520 }, { "epoch": 0.21, "learning_rate": 1.8429621360169876e-05, "loss": 1.4756, "step": 7521 }, { "epoch": 0.21, "learning_rate": 1.842914548629848e-05, "loss": 1.3799, "step": 7522 }, { "epoch": 0.21, "learning_rate": 1.842866954648141e-05, "loss": 1.4309, "step": 7523 }, { "epoch": 0.21, "learning_rate": 1.8428193540722396e-05, "loss": 1.3115, "step": 7524 }, { "epoch": 0.21, "learning_rate": 1.8427717469025158e-05, "loss": 1.4189, "step": 7525 }, { "epoch": 0.21, "learning_rate": 1.8427241331393422e-05, "loss": 1.3325, "step": 7526 }, { "epoch": 0.21, "learning_rate": 1.842676512783091e-05, "loss": 1.3491, "step": 7527 }, { "epoch": 0.21, "learning_rate": 1.8426288858341356e-05, "loss": 1.519, "step": 7528 }, { "epoch": 0.21, "learning_rate": 1.8425812522928474e-05, "loss": 1.324, "step": 7529 }, { "epoch": 0.21, "learning_rate": 1.8425336121596e-05, "loss": 1.668, "step": 7530 }, { "epoch": 0.21, "learning_rate": 1.842485965434766e-05, "loss": 1.3008, "step": 7531 }, { "epoch": 0.21, "learning_rate": 1.8424383121187175e-05, "loss": 1.5234, "step": 7532 }, { "epoch": 0.21, "learning_rate": 1.842390652211828e-05, "loss": 1.2654, "step": 7533 }, { "epoch": 0.21, "learning_rate": 1.84234298571447e-05, "loss": 1.406, "step": 7534 }, { "epoch": 0.21, "learning_rate": 1.842295312627017e-05, "loss": 1.4563, "step": 7535 }, { "epoch": 0.21, "learning_rate": 1.8422476329498415e-05, "loss": 1.5239, "step": 7536 }, { "epoch": 0.21, "learning_rate": 1.8421999466833164e-05, "loss": 1.3259, "step": 7537 }, { "epoch": 0.21, "learning_rate": 1.842152253827815e-05, "loss": 1.2922, "step": 7538 }, { "epoch": 0.21, "learning_rate": 1.84210455438371e-05, "loss": 1.3931, "step": 7539 }, { "epoch": 0.21, "learning_rate": 1.8420568483513752e-05, "loss": 1.301, "step": 7540 }, { "epoch": 0.21, "learning_rate": 1.8420091357311835e-05, "loss": 1.3557, "step": 7541 }, { "epoch": 0.21, "learning_rate": 1.8419614165235085e-05, "loss": 1.5391, "step": 7542 }, { "epoch": 0.21, "learning_rate": 1.8419136907287232e-05, "loss": 1.4995, "step": 7543 }, { "epoch": 0.21, "learning_rate": 1.8418659583472013e-05, "loss": 1.4785, "step": 7544 }, { "epoch": 0.21, "learning_rate": 1.8418182193793156e-05, "loss": 1.2844, "step": 7545 }, { "epoch": 0.21, "learning_rate": 1.8417704738254404e-05, "loss": 1.5002, "step": 7546 }, { "epoch": 0.21, "learning_rate": 1.8417227216859484e-05, "loss": 1.4355, "step": 7547 }, { "epoch": 0.21, "learning_rate": 1.841674962961214e-05, "loss": 1.75, "step": 7548 }, { "epoch": 0.21, "learning_rate": 1.84162719765161e-05, "loss": 1.3503, "step": 7549 }, { "epoch": 0.21, "learning_rate": 1.841579425757511e-05, "loss": 1.3694, "step": 7550 }, { "epoch": 0.21, "learning_rate": 1.84153164727929e-05, "loss": 1.4268, "step": 7551 }, { "epoch": 0.21, "learning_rate": 1.8414838622173214e-05, "loss": 1.4758, "step": 7552 }, { "epoch": 0.21, "learning_rate": 1.841436070571979e-05, "loss": 1.3286, "step": 7553 }, { "epoch": 0.21, "learning_rate": 1.841388272343636e-05, "loss": 1.5815, "step": 7554 }, { "epoch": 0.21, "learning_rate": 1.8413404675326667e-05, "loss": 1.6172, "step": 7555 }, { "epoch": 0.21, "learning_rate": 1.8412926561394456e-05, "loss": 1.7178, "step": 7556 }, { "epoch": 0.21, "learning_rate": 1.8412448381643462e-05, "loss": 1.3945, "step": 7557 }, { "epoch": 0.21, "learning_rate": 1.841197013607743e-05, "loss": 1.4663, "step": 7558 }, { "epoch": 0.21, "learning_rate": 1.8411491824700097e-05, "loss": 1.2021, "step": 7559 }, { "epoch": 0.21, "learning_rate": 1.8411013447515203e-05, "loss": 1.5042, "step": 7560 }, { "epoch": 0.21, "learning_rate": 1.8410535004526502e-05, "loss": 1.4739, "step": 7561 }, { "epoch": 0.21, "learning_rate": 1.8410056495737726e-05, "loss": 1.4304, "step": 7562 }, { "epoch": 0.21, "learning_rate": 1.8409577921152624e-05, "loss": 1.4863, "step": 7563 }, { "epoch": 0.21, "learning_rate": 1.840909928077494e-05, "loss": 1.4458, "step": 7564 }, { "epoch": 0.21, "learning_rate": 1.8408620574608415e-05, "loss": 1.3005, "step": 7565 }, { "epoch": 0.21, "learning_rate": 1.84081418026568e-05, "loss": 1.4653, "step": 7566 }, { "epoch": 0.21, "learning_rate": 1.8407662964923832e-05, "loss": 1.322, "step": 7567 }, { "epoch": 0.21, "learning_rate": 1.840718406141327e-05, "loss": 1.5166, "step": 7568 }, { "epoch": 0.21, "learning_rate": 1.8406705092128848e-05, "loss": 1.3357, "step": 7569 }, { "epoch": 0.21, "learning_rate": 1.8406226057074318e-05, "loss": 1.2239, "step": 7570 }, { "epoch": 0.21, "learning_rate": 1.8405746956253426e-05, "loss": 1.4155, "step": 7571 }, { "epoch": 0.21, "learning_rate": 1.840526778966993e-05, "loss": 1.3599, "step": 7572 }, { "epoch": 0.21, "learning_rate": 1.8404788557327565e-05, "loss": 1.3523, "step": 7573 }, { "epoch": 0.21, "learning_rate": 1.8404309259230087e-05, "loss": 1.2886, "step": 7574 }, { "epoch": 0.21, "learning_rate": 1.840382989538125e-05, "loss": 1.499, "step": 7575 }, { "epoch": 0.21, "learning_rate": 1.8403350465784794e-05, "loss": 1.2488, "step": 7576 }, { "epoch": 0.21, "learning_rate": 1.8402870970444483e-05, "loss": 1.3364, "step": 7577 }, { "epoch": 0.21, "learning_rate": 1.8402391409364055e-05, "loss": 1.3845, "step": 7578 }, { "epoch": 0.21, "learning_rate": 1.8401911782547266e-05, "loss": 1.3767, "step": 7579 }, { "epoch": 0.21, "learning_rate": 1.840143208999787e-05, "loss": 1.5039, "step": 7580 }, { "epoch": 0.21, "learning_rate": 1.8400952331719624e-05, "loss": 1.3279, "step": 7581 }, { "epoch": 0.21, "learning_rate": 1.840047250771628e-05, "loss": 1.459, "step": 7582 }, { "epoch": 0.21, "learning_rate": 1.8399992617991584e-05, "loss": 1.1899, "step": 7583 }, { "epoch": 0.21, "learning_rate": 1.83995126625493e-05, "loss": 1.3901, "step": 7584 }, { "epoch": 0.21, "learning_rate": 1.8399032641393174e-05, "loss": 1.3721, "step": 7585 }, { "epoch": 0.21, "learning_rate": 1.839855255452697e-05, "loss": 1.4082, "step": 7586 }, { "epoch": 0.21, "learning_rate": 1.8398072401954436e-05, "loss": 1.3291, "step": 7587 }, { "epoch": 0.21, "learning_rate": 1.8397592183679335e-05, "loss": 1.5142, "step": 7588 }, { "epoch": 0.21, "learning_rate": 1.839711189970542e-05, "loss": 1.4229, "step": 7589 }, { "epoch": 0.21, "learning_rate": 1.839663155003645e-05, "loss": 1.4797, "step": 7590 }, { "epoch": 0.21, "learning_rate": 1.8396151134676187e-05, "loss": 1.3027, "step": 7591 }, { "epoch": 0.21, "learning_rate": 1.839567065362838e-05, "loss": 1.3329, "step": 7592 }, { "epoch": 0.21, "learning_rate": 1.83951901068968e-05, "loss": 1.4302, "step": 7593 }, { "epoch": 0.21, "learning_rate": 1.8394709494485193e-05, "loss": 1.4302, "step": 7594 }, { "epoch": 0.21, "learning_rate": 1.839422881639733e-05, "loss": 1.5107, "step": 7595 }, { "epoch": 0.21, "learning_rate": 1.8393748072636973e-05, "loss": 1.2517, "step": 7596 }, { "epoch": 0.21, "learning_rate": 1.8393267263207874e-05, "loss": 1.426, "step": 7597 }, { "epoch": 0.21, "learning_rate": 1.8392786388113796e-05, "loss": 1.4639, "step": 7598 }, { "epoch": 0.21, "learning_rate": 1.8392305447358507e-05, "loss": 1.4402, "step": 7599 }, { "epoch": 0.21, "learning_rate": 1.8391824440945763e-05, "loss": 1.6001, "step": 7600 }, { "epoch": 0.21, "learning_rate": 1.8391343368879337e-05, "loss": 1.4978, "step": 7601 }, { "epoch": 0.21, "learning_rate": 1.839086223116298e-05, "loss": 1.3748, "step": 7602 }, { "epoch": 0.21, "learning_rate": 1.839038102780047e-05, "loss": 1.3213, "step": 7603 }, { "epoch": 0.21, "learning_rate": 1.838989975879556e-05, "loss": 1.3303, "step": 7604 }, { "epoch": 0.21, "learning_rate": 1.8389418424152016e-05, "loss": 1.5688, "step": 7605 }, { "epoch": 0.21, "learning_rate": 1.838893702387361e-05, "loss": 1.2827, "step": 7606 }, { "epoch": 0.21, "learning_rate": 1.8388455557964108e-05, "loss": 1.4243, "step": 7607 }, { "epoch": 0.21, "learning_rate": 1.838797402642727e-05, "loss": 1.3298, "step": 7608 }, { "epoch": 0.21, "learning_rate": 1.838749242926687e-05, "loss": 1.4382, "step": 7609 }, { "epoch": 0.21, "learning_rate": 1.8387010766486673e-05, "loss": 1.5078, "step": 7610 }, { "epoch": 0.21, "learning_rate": 1.838652903809045e-05, "loss": 1.2791, "step": 7611 }, { "epoch": 0.21, "learning_rate": 1.8386047244081964e-05, "loss": 1.3391, "step": 7612 }, { "epoch": 0.21, "learning_rate": 1.838556538446499e-05, "loss": 1.2954, "step": 7613 }, { "epoch": 0.21, "learning_rate": 1.838508345924329e-05, "loss": 1.2156, "step": 7614 }, { "epoch": 0.21, "learning_rate": 1.8384601468420648e-05, "loss": 1.3779, "step": 7615 }, { "epoch": 0.21, "learning_rate": 1.838411941200082e-05, "loss": 1.4082, "step": 7616 }, { "epoch": 0.21, "learning_rate": 1.8383637289987587e-05, "loss": 1.2998, "step": 7617 }, { "epoch": 0.21, "learning_rate": 1.838315510238472e-05, "loss": 1.4053, "step": 7618 }, { "epoch": 0.21, "learning_rate": 1.8382672849195988e-05, "loss": 1.4097, "step": 7619 }, { "epoch": 0.21, "learning_rate": 1.8382190530425165e-05, "loss": 1.3887, "step": 7620 }, { "epoch": 0.21, "learning_rate": 1.8381708146076025e-05, "loss": 1.2034, "step": 7621 }, { "epoch": 0.21, "learning_rate": 1.8381225696152342e-05, "loss": 1.4424, "step": 7622 }, { "epoch": 0.21, "learning_rate": 1.8380743180657893e-05, "loss": 1.7939, "step": 7623 }, { "epoch": 0.21, "learning_rate": 1.8380260599596447e-05, "loss": 1.4727, "step": 7624 }, { "epoch": 0.21, "learning_rate": 1.837977795297178e-05, "loss": 1.3462, "step": 7625 }, { "epoch": 0.21, "learning_rate": 1.8379295240787677e-05, "loss": 1.2925, "step": 7626 }, { "epoch": 0.21, "learning_rate": 1.8378812463047905e-05, "loss": 1.5317, "step": 7627 }, { "epoch": 0.21, "learning_rate": 1.8378329619756243e-05, "loss": 1.3237, "step": 7628 }, { "epoch": 0.21, "learning_rate": 1.8377846710916472e-05, "loss": 1.3655, "step": 7629 }, { "epoch": 0.21, "learning_rate": 1.8377363736532366e-05, "loss": 1.2124, "step": 7630 }, { "epoch": 0.21, "learning_rate": 1.8376880696607708e-05, "loss": 1.4575, "step": 7631 }, { "epoch": 0.21, "learning_rate": 1.8376397591146273e-05, "loss": 1.7041, "step": 7632 }, { "epoch": 0.21, "learning_rate": 1.8375914420151845e-05, "loss": 1.1768, "step": 7633 }, { "epoch": 0.21, "learning_rate": 1.8375431183628193e-05, "loss": 1.3069, "step": 7634 }, { "epoch": 0.21, "learning_rate": 1.8374947881579116e-05, "loss": 1.4756, "step": 7635 }, { "epoch": 0.21, "learning_rate": 1.8374464514008378e-05, "loss": 1.4883, "step": 7636 }, { "epoch": 0.21, "learning_rate": 1.837398108091977e-05, "loss": 1.332, "step": 7637 }, { "epoch": 0.21, "learning_rate": 1.8373497582317073e-05, "loss": 1.4604, "step": 7638 }, { "epoch": 0.21, "learning_rate": 1.8373014018204066e-05, "loss": 1.8379, "step": 7639 }, { "epoch": 0.21, "learning_rate": 1.8372530388584536e-05, "loss": 1.385, "step": 7640 }, { "epoch": 0.21, "learning_rate": 1.8372046693462264e-05, "loss": 1.5229, "step": 7641 }, { "epoch": 0.21, "learning_rate": 1.8371562932841035e-05, "loss": 1.2959, "step": 7642 }, { "epoch": 0.21, "learning_rate": 1.8371079106724637e-05, "loss": 1.4429, "step": 7643 }, { "epoch": 0.21, "learning_rate": 1.837059521511685e-05, "loss": 1.3633, "step": 7644 }, { "epoch": 0.21, "learning_rate": 1.8370111258021464e-05, "loss": 1.4551, "step": 7645 }, { "epoch": 0.21, "learning_rate": 1.8369627235442266e-05, "loss": 1.3999, "step": 7646 }, { "epoch": 0.21, "learning_rate": 1.8369143147383036e-05, "loss": 1.2893, "step": 7647 }, { "epoch": 0.21, "learning_rate": 1.8368658993847566e-05, "loss": 1.3801, "step": 7648 }, { "epoch": 0.21, "learning_rate": 1.836817477483964e-05, "loss": 1.2083, "step": 7649 }, { "epoch": 0.21, "learning_rate": 1.8367690490363056e-05, "loss": 1.3276, "step": 7650 }, { "epoch": 0.21, "learning_rate": 1.8367206140421592e-05, "loss": 1.2781, "step": 7651 }, { "epoch": 0.21, "learning_rate": 1.8366721725019046e-05, "loss": 1.2415, "step": 7652 }, { "epoch": 0.21, "learning_rate": 1.8366237244159197e-05, "loss": 1.7847, "step": 7653 }, { "epoch": 0.21, "learning_rate": 1.836575269784585e-05, "loss": 1.5454, "step": 7654 }, { "epoch": 0.21, "learning_rate": 1.836526808608278e-05, "loss": 1.4666, "step": 7655 }, { "epoch": 0.21, "learning_rate": 1.836478340887379e-05, "loss": 1.215, "step": 7656 }, { "epoch": 0.21, "learning_rate": 1.836429866622267e-05, "loss": 1.4165, "step": 7657 }, { "epoch": 0.21, "learning_rate": 1.8363813858133206e-05, "loss": 1.4319, "step": 7658 }, { "epoch": 0.21, "learning_rate": 1.8363328984609198e-05, "loss": 1.2886, "step": 7659 }, { "epoch": 0.21, "learning_rate": 1.8362844045654436e-05, "loss": 1.4229, "step": 7660 }, { "epoch": 0.21, "learning_rate": 1.8362359041272714e-05, "loss": 1.3481, "step": 7661 }, { "epoch": 0.21, "learning_rate": 1.8361873971467827e-05, "loss": 1.3142, "step": 7662 }, { "epoch": 0.21, "learning_rate": 1.836138883624357e-05, "loss": 1.2014, "step": 7663 }, { "epoch": 0.21, "learning_rate": 1.836090363560374e-05, "loss": 1.4434, "step": 7664 }, { "epoch": 0.21, "learning_rate": 1.836041836955213e-05, "loss": 1.467, "step": 7665 }, { "epoch": 0.21, "learning_rate": 1.8359933038092543e-05, "loss": 1.3267, "step": 7666 }, { "epoch": 0.21, "learning_rate": 1.8359447641228764e-05, "loss": 1.3999, "step": 7667 }, { "epoch": 0.21, "learning_rate": 1.83589621789646e-05, "loss": 1.261, "step": 7668 }, { "epoch": 0.21, "learning_rate": 1.8358476651303848e-05, "loss": 1.252, "step": 7669 }, { "epoch": 0.21, "learning_rate": 1.8357991058250305e-05, "loss": 1.3267, "step": 7670 }, { "epoch": 0.21, "learning_rate": 1.835750539980777e-05, "loss": 1.3613, "step": 7671 }, { "epoch": 0.21, "learning_rate": 1.835701967598004e-05, "loss": 1.3201, "step": 7672 }, { "epoch": 0.21, "learning_rate": 1.835653388677092e-05, "loss": 1.3667, "step": 7673 }, { "epoch": 0.21, "learning_rate": 1.835604803218421e-05, "loss": 1.3218, "step": 7674 }, { "epoch": 0.21, "learning_rate": 1.8355562112223707e-05, "loss": 1.3755, "step": 7675 }, { "epoch": 0.21, "learning_rate": 1.8355076126893214e-05, "loss": 1.4116, "step": 7676 }, { "epoch": 0.21, "learning_rate": 1.8354590076196537e-05, "loss": 1.3911, "step": 7677 }, { "epoch": 0.21, "learning_rate": 1.8354103960137476e-05, "loss": 1.4026, "step": 7678 }, { "epoch": 0.21, "learning_rate": 1.835361777871983e-05, "loss": 1.3235, "step": 7679 }, { "epoch": 0.21, "learning_rate": 1.835313153194741e-05, "loss": 1.4341, "step": 7680 }, { "epoch": 0.21, "learning_rate": 1.8352645219824017e-05, "loss": 1.1982, "step": 7681 }, { "epoch": 0.21, "learning_rate": 1.8352158842353455e-05, "loss": 1.4863, "step": 7682 }, { "epoch": 0.21, "learning_rate": 1.835167239953953e-05, "loss": 1.5967, "step": 7683 }, { "epoch": 0.21, "learning_rate": 1.8351185891386046e-05, "loss": 1.4536, "step": 7684 }, { "epoch": 0.21, "learning_rate": 1.8350699317896813e-05, "loss": 1.4829, "step": 7685 }, { "epoch": 0.21, "learning_rate": 1.8350212679075633e-05, "loss": 1.2642, "step": 7686 }, { "epoch": 0.21, "learning_rate": 1.8349725974926316e-05, "loss": 1.3638, "step": 7687 }, { "epoch": 0.21, "learning_rate": 1.834923920545267e-05, "loss": 1.4468, "step": 7688 }, { "epoch": 0.21, "learning_rate": 1.83487523706585e-05, "loss": 1.4539, "step": 7689 }, { "epoch": 0.21, "learning_rate": 1.834826547054762e-05, "loss": 1.386, "step": 7690 }, { "epoch": 0.21, "learning_rate": 1.8347778505123836e-05, "loss": 1.52, "step": 7691 }, { "epoch": 0.21, "learning_rate": 1.834729147439096e-05, "loss": 1.3154, "step": 7692 }, { "epoch": 0.21, "learning_rate": 1.83468043783528e-05, "loss": 1.4111, "step": 7693 }, { "epoch": 0.21, "learning_rate": 1.8346317217013166e-05, "loss": 1.4519, "step": 7694 }, { "epoch": 0.21, "learning_rate": 1.834582999037587e-05, "loss": 1.4556, "step": 7695 }, { "epoch": 0.21, "learning_rate": 1.8345342698444727e-05, "loss": 1.4526, "step": 7696 }, { "epoch": 0.21, "learning_rate": 1.8344855341223545e-05, "loss": 1.2751, "step": 7697 }, { "epoch": 0.21, "learning_rate": 1.834436791871614e-05, "loss": 1.417, "step": 7698 }, { "epoch": 0.21, "learning_rate": 1.8343880430926326e-05, "loss": 1.2966, "step": 7699 }, { "epoch": 0.21, "learning_rate": 1.8343392877857912e-05, "loss": 1.4329, "step": 7700 }, { "epoch": 0.21, "learning_rate": 1.8342905259514717e-05, "loss": 1.7153, "step": 7701 }, { "epoch": 0.21, "learning_rate": 1.8342417575900553e-05, "loss": 1.303, "step": 7702 }, { "epoch": 0.21, "learning_rate": 1.8341929827019237e-05, "loss": 1.282, "step": 7703 }, { "epoch": 0.21, "learning_rate": 1.8341442012874588e-05, "loss": 1.1025, "step": 7704 }, { "epoch": 0.21, "learning_rate": 1.8340954133470417e-05, "loss": 1.5229, "step": 7705 }, { "epoch": 0.21, "learning_rate": 1.834046618881054e-05, "loss": 1.3787, "step": 7706 }, { "epoch": 0.21, "learning_rate": 1.833997817889878e-05, "loss": 1.5859, "step": 7707 }, { "epoch": 0.21, "learning_rate": 1.8339490103738953e-05, "loss": 1.2566, "step": 7708 }, { "epoch": 0.21, "learning_rate": 1.833900196333488e-05, "loss": 1.3813, "step": 7709 }, { "epoch": 0.21, "learning_rate": 1.833851375769037e-05, "loss": 1.3064, "step": 7710 }, { "epoch": 0.21, "learning_rate": 1.8338025486809254e-05, "loss": 1.4131, "step": 7711 }, { "epoch": 0.21, "learning_rate": 1.8337537150695347e-05, "loss": 1.4023, "step": 7712 }, { "epoch": 0.21, "learning_rate": 1.8337048749352466e-05, "loss": 1.5005, "step": 7713 }, { "epoch": 0.21, "learning_rate": 1.833656028278444e-05, "loss": 1.3459, "step": 7714 }, { "epoch": 0.21, "learning_rate": 1.8336071750995087e-05, "loss": 1.4265, "step": 7715 }, { "epoch": 0.21, "learning_rate": 1.8335583153988226e-05, "loss": 1.3977, "step": 7716 }, { "epoch": 0.21, "learning_rate": 1.8335094491767685e-05, "loss": 1.4741, "step": 7717 }, { "epoch": 0.21, "learning_rate": 1.8334605764337283e-05, "loss": 1.3076, "step": 7718 }, { "epoch": 0.21, "learning_rate": 1.833411697170084e-05, "loss": 1.304, "step": 7719 }, { "epoch": 0.21, "learning_rate": 1.833362811386219e-05, "loss": 1.3835, "step": 7720 }, { "epoch": 0.21, "learning_rate": 1.833313919082515e-05, "loss": 1.3403, "step": 7721 }, { "epoch": 0.21, "learning_rate": 1.8332650202593552e-05, "loss": 1.1814, "step": 7722 }, { "epoch": 0.21, "learning_rate": 1.8332161149171213e-05, "loss": 1.2854, "step": 7723 }, { "epoch": 0.21, "learning_rate": 1.8331672030561965e-05, "loss": 1.5886, "step": 7724 }, { "epoch": 0.21, "learning_rate": 1.8331182846769627e-05, "loss": 1.4146, "step": 7725 }, { "epoch": 0.21, "learning_rate": 1.833069359779804e-05, "loss": 1.3403, "step": 7726 }, { "epoch": 0.21, "learning_rate": 1.833020428365102e-05, "loss": 1.4468, "step": 7727 }, { "epoch": 0.21, "learning_rate": 1.8329714904332402e-05, "loss": 1.3848, "step": 7728 }, { "epoch": 0.21, "learning_rate": 1.8329225459846007e-05, "loss": 1.3835, "step": 7729 }, { "epoch": 0.21, "learning_rate": 1.8328735950195667e-05, "loss": 1.2549, "step": 7730 }, { "epoch": 0.21, "learning_rate": 1.832824637538522e-05, "loss": 1.3284, "step": 7731 }, { "epoch": 0.21, "learning_rate": 1.8327756735418485e-05, "loss": 1.2947, "step": 7732 }, { "epoch": 0.21, "learning_rate": 1.83272670302993e-05, "loss": 1.3472, "step": 7733 }, { "epoch": 0.21, "learning_rate": 1.832677726003149e-05, "loss": 1.2495, "step": 7734 }, { "epoch": 0.21, "learning_rate": 1.8326287424618893e-05, "loss": 1.3921, "step": 7735 }, { "epoch": 0.21, "learning_rate": 1.8325797524065337e-05, "loss": 1.3655, "step": 7736 }, { "epoch": 0.21, "learning_rate": 1.8325307558374657e-05, "loss": 1.439, "step": 7737 }, { "epoch": 0.21, "learning_rate": 1.8324817527550687e-05, "loss": 1.5024, "step": 7738 }, { "epoch": 0.21, "learning_rate": 1.8324327431597257e-05, "loss": 1.4453, "step": 7739 }, { "epoch": 0.21, "learning_rate": 1.8323837270518207e-05, "loss": 1.459, "step": 7740 }, { "epoch": 0.21, "learning_rate": 1.8323347044317367e-05, "loss": 1.3633, "step": 7741 }, { "epoch": 0.21, "learning_rate": 1.832285675299857e-05, "loss": 1.4429, "step": 7742 }, { "epoch": 0.21, "learning_rate": 1.8322366396565657e-05, "loss": 1.2732, "step": 7743 }, { "epoch": 0.21, "learning_rate": 1.8321875975022465e-05, "loss": 1.3762, "step": 7744 }, { "epoch": 0.21, "learning_rate": 1.8321385488372827e-05, "loss": 1.4026, "step": 7745 }, { "epoch": 0.21, "learning_rate": 1.8320894936620583e-05, "loss": 1.3877, "step": 7746 }, { "epoch": 0.21, "learning_rate": 1.832040431976957e-05, "loss": 1.3599, "step": 7747 }, { "epoch": 0.21, "learning_rate": 1.8319913637823625e-05, "loss": 1.3672, "step": 7748 }, { "epoch": 0.21, "learning_rate": 1.8319422890786586e-05, "loss": 1.3804, "step": 7749 }, { "epoch": 0.21, "learning_rate": 1.8318932078662296e-05, "loss": 1.4531, "step": 7750 }, { "epoch": 0.21, "learning_rate": 1.8318441201454595e-05, "loss": 1.1555, "step": 7751 }, { "epoch": 0.21, "learning_rate": 1.831795025916732e-05, "loss": 1.2988, "step": 7752 }, { "epoch": 0.21, "learning_rate": 1.8317459251804315e-05, "loss": 1.22, "step": 7753 }, { "epoch": 0.21, "learning_rate": 1.8316968179369418e-05, "loss": 1.3652, "step": 7754 }, { "epoch": 0.21, "learning_rate": 1.8316477041866474e-05, "loss": 1.4412, "step": 7755 }, { "epoch": 0.21, "learning_rate": 1.8315985839299324e-05, "loss": 1.3203, "step": 7756 }, { "epoch": 0.21, "learning_rate": 1.831549457167181e-05, "loss": 1.415, "step": 7757 }, { "epoch": 0.21, "learning_rate": 1.831500323898778e-05, "loss": 1.2842, "step": 7758 }, { "epoch": 0.21, "learning_rate": 1.8314511841251072e-05, "loss": 1.2019, "step": 7759 }, { "epoch": 0.21, "learning_rate": 1.8314020378465535e-05, "loss": 1.2576, "step": 7760 }, { "epoch": 0.21, "learning_rate": 1.831352885063501e-05, "loss": 1.4023, "step": 7761 }, { "epoch": 0.21, "learning_rate": 1.8313037257763344e-05, "loss": 1.3479, "step": 7762 }, { "epoch": 0.21, "learning_rate": 1.8312545599854386e-05, "loss": 1.1357, "step": 7763 }, { "epoch": 0.21, "learning_rate": 1.831205387691198e-05, "loss": 1.4478, "step": 7764 }, { "epoch": 0.21, "learning_rate": 1.8311562088939973e-05, "loss": 1.3599, "step": 7765 }, { "epoch": 0.21, "learning_rate": 1.831107023594221e-05, "loss": 1.251, "step": 7766 }, { "epoch": 0.21, "learning_rate": 1.831057831792254e-05, "loss": 1.0593, "step": 7767 }, { "epoch": 0.21, "learning_rate": 1.831008633488482e-05, "loss": 1.4573, "step": 7768 }, { "epoch": 0.21, "learning_rate": 1.830959428683289e-05, "loss": 1.7754, "step": 7769 }, { "epoch": 0.21, "learning_rate": 1.8309102173770597e-05, "loss": 1.2842, "step": 7770 }, { "epoch": 0.21, "learning_rate": 1.83086099957018e-05, "loss": 1.3247, "step": 7771 }, { "epoch": 0.21, "learning_rate": 1.8308117752630344e-05, "loss": 1.3818, "step": 7772 }, { "epoch": 0.21, "learning_rate": 1.8307625444560085e-05, "loss": 1.4216, "step": 7773 }, { "epoch": 0.21, "learning_rate": 1.8307133071494866e-05, "loss": 1.4124, "step": 7774 }, { "epoch": 0.21, "learning_rate": 1.8306640633438548e-05, "loss": 1.2463, "step": 7775 }, { "epoch": 0.21, "learning_rate": 1.8306148130394978e-05, "loss": 1.4641, "step": 7776 }, { "epoch": 0.21, "learning_rate": 1.830565556236801e-05, "loss": 1.5059, "step": 7777 }, { "epoch": 0.21, "learning_rate": 1.83051629293615e-05, "loss": 1.4392, "step": 7778 }, { "epoch": 0.21, "learning_rate": 1.83046702313793e-05, "loss": 1.4109, "step": 7779 }, { "epoch": 0.21, "learning_rate": 1.8304177468425263e-05, "loss": 1.3911, "step": 7780 }, { "epoch": 0.21, "learning_rate": 1.830368464050325e-05, "loss": 1.4609, "step": 7781 }, { "epoch": 0.21, "learning_rate": 1.8303191747617114e-05, "loss": 1.1515, "step": 7782 }, { "epoch": 0.21, "learning_rate": 1.8302698789770706e-05, "loss": 1.4656, "step": 7783 }, { "epoch": 0.21, "learning_rate": 1.830220576696789e-05, "loss": 1.4075, "step": 7784 }, { "epoch": 0.21, "learning_rate": 1.8301712679212516e-05, "loss": 1.3596, "step": 7785 }, { "epoch": 0.21, "learning_rate": 1.830121952650845e-05, "loss": 1.3479, "step": 7786 }, { "epoch": 0.21, "learning_rate": 1.8300726308859543e-05, "loss": 1.5044, "step": 7787 }, { "epoch": 0.21, "learning_rate": 1.8300233026269658e-05, "loss": 1.3735, "step": 7788 }, { "epoch": 0.21, "learning_rate": 1.8299739678742653e-05, "loss": 1.3696, "step": 7789 }, { "epoch": 0.21, "learning_rate": 1.829924626628239e-05, "loss": 1.324, "step": 7790 }, { "epoch": 0.21, "learning_rate": 1.829875278889272e-05, "loss": 1.3435, "step": 7791 }, { "epoch": 0.21, "learning_rate": 1.8298259246577517e-05, "loss": 1.4341, "step": 7792 }, { "epoch": 0.21, "learning_rate": 1.8297765639340635e-05, "loss": 1.2839, "step": 7793 }, { "epoch": 0.21, "learning_rate": 1.8297271967185932e-05, "loss": 1.3853, "step": 7794 }, { "epoch": 0.21, "learning_rate": 1.829677823011728e-05, "loss": 1.5049, "step": 7795 }, { "epoch": 0.21, "learning_rate": 1.8296284428138532e-05, "loss": 1.3657, "step": 7796 }, { "epoch": 0.21, "learning_rate": 1.829579056125356e-05, "loss": 1.2703, "step": 7797 }, { "epoch": 0.21, "learning_rate": 1.8295296629466223e-05, "loss": 1.4854, "step": 7798 }, { "epoch": 0.21, "learning_rate": 1.8294802632780383e-05, "loss": 1.4878, "step": 7799 }, { "epoch": 0.21, "learning_rate": 1.829430857119991e-05, "loss": 1.2932, "step": 7800 }, { "epoch": 0.21, "learning_rate": 1.8293814444728665e-05, "loss": 1.3555, "step": 7801 }, { "epoch": 0.21, "learning_rate": 1.8293320253370517e-05, "loss": 1.4875, "step": 7802 }, { "epoch": 0.21, "learning_rate": 1.8292825997129334e-05, "loss": 1.3835, "step": 7803 }, { "epoch": 0.21, "learning_rate": 1.8292331676008978e-05, "loss": 1.3328, "step": 7804 }, { "epoch": 0.21, "learning_rate": 1.8291837290013315e-05, "loss": 1.3552, "step": 7805 }, { "epoch": 0.21, "learning_rate": 1.8291342839146217e-05, "loss": 1.2754, "step": 7806 }, { "epoch": 0.21, "learning_rate": 1.8290848323411554e-05, "loss": 1.3726, "step": 7807 }, { "epoch": 0.21, "learning_rate": 1.8290353742813192e-05, "loss": 1.3684, "step": 7808 }, { "epoch": 0.21, "learning_rate": 1.8289859097355e-05, "loss": 1.3091, "step": 7809 }, { "epoch": 0.21, "learning_rate": 1.828936438704085e-05, "loss": 1.3398, "step": 7810 }, { "epoch": 0.21, "learning_rate": 1.8288869611874608e-05, "loss": 1.4048, "step": 7811 }, { "epoch": 0.21, "learning_rate": 1.828837477186015e-05, "loss": 1.3315, "step": 7812 }, { "epoch": 0.21, "learning_rate": 1.8287879867001347e-05, "loss": 1.3931, "step": 7813 }, { "epoch": 0.21, "learning_rate": 1.8287384897302066e-05, "loss": 1.3945, "step": 7814 }, { "epoch": 0.21, "learning_rate": 1.8286889862766184e-05, "loss": 1.2849, "step": 7815 }, { "epoch": 0.21, "learning_rate": 1.828639476339757e-05, "loss": 1.3745, "step": 7816 }, { "epoch": 0.21, "learning_rate": 1.8285899599200104e-05, "loss": 1.3926, "step": 7817 }, { "epoch": 0.21, "learning_rate": 1.8285404370177654e-05, "loss": 1.7798, "step": 7818 }, { "epoch": 0.21, "learning_rate": 1.8284909076334094e-05, "loss": 1.332, "step": 7819 }, { "epoch": 0.21, "learning_rate": 1.8284413717673306e-05, "loss": 1.3281, "step": 7820 }, { "epoch": 0.21, "learning_rate": 1.8283918294199156e-05, "loss": 1.3901, "step": 7821 }, { "epoch": 0.21, "learning_rate": 1.828342280591553e-05, "loss": 1.3374, "step": 7822 }, { "epoch": 0.21, "learning_rate": 1.8282927252826295e-05, "loss": 1.3943, "step": 7823 }, { "epoch": 0.21, "learning_rate": 1.8282431634935333e-05, "loss": 1.6464, "step": 7824 }, { "epoch": 0.21, "learning_rate": 1.828193595224652e-05, "loss": 1.4028, "step": 7825 }, { "epoch": 0.21, "learning_rate": 1.8281440204763734e-05, "loss": 1.4058, "step": 7826 }, { "epoch": 0.21, "learning_rate": 1.8280944392490853e-05, "loss": 1.457, "step": 7827 }, { "epoch": 0.21, "learning_rate": 1.8280448515431763e-05, "loss": 1.4319, "step": 7828 }, { "epoch": 0.21, "learning_rate": 1.8279952573590332e-05, "loss": 1.4072, "step": 7829 }, { "epoch": 0.21, "learning_rate": 1.8279456566970448e-05, "loss": 1.3315, "step": 7830 }, { "epoch": 0.21, "learning_rate": 1.8278960495575985e-05, "loss": 1.479, "step": 7831 }, { "epoch": 0.21, "learning_rate": 1.8278464359410834e-05, "loss": 1.4158, "step": 7832 }, { "epoch": 0.21, "learning_rate": 1.8277968158478868e-05, "loss": 1.2786, "step": 7833 }, { "epoch": 0.21, "learning_rate": 1.827747189278397e-05, "loss": 1.4456, "step": 7834 }, { "epoch": 0.21, "learning_rate": 1.8276975562330025e-05, "loss": 1.4021, "step": 7835 }, { "epoch": 0.21, "learning_rate": 1.8276479167120918e-05, "loss": 1.7524, "step": 7836 }, { "epoch": 0.21, "learning_rate": 1.827598270716053e-05, "loss": 1.4277, "step": 7837 }, { "epoch": 0.21, "learning_rate": 1.8275486182452743e-05, "loss": 1.47, "step": 7838 }, { "epoch": 0.21, "learning_rate": 1.827498959300144e-05, "loss": 1.2766, "step": 7839 }, { "epoch": 0.21, "learning_rate": 1.8274492938810516e-05, "loss": 1.4143, "step": 7840 }, { "epoch": 0.21, "learning_rate": 1.8273996219883848e-05, "loss": 1.4204, "step": 7841 }, { "epoch": 0.21, "learning_rate": 1.8273499436225323e-05, "loss": 1.3542, "step": 7842 }, { "epoch": 0.21, "learning_rate": 1.827300258783883e-05, "loss": 1.3762, "step": 7843 }, { "epoch": 0.21, "learning_rate": 1.8272505674728254e-05, "loss": 1.2183, "step": 7844 }, { "epoch": 0.21, "learning_rate": 1.8272008696897485e-05, "loss": 1.2178, "step": 7845 }, { "epoch": 0.21, "learning_rate": 1.8271511654350407e-05, "loss": 1.0789, "step": 7846 }, { "epoch": 0.21, "learning_rate": 1.8271014547090917e-05, "loss": 1.5005, "step": 7847 }, { "epoch": 0.21, "learning_rate": 1.827051737512289e-05, "loss": 1.3755, "step": 7848 }, { "epoch": 0.21, "learning_rate": 1.8270020138450233e-05, "loss": 1.2793, "step": 7849 }, { "epoch": 0.21, "learning_rate": 1.8269522837076822e-05, "loss": 1.2559, "step": 7850 }, { "epoch": 0.21, "learning_rate": 1.826902547100655e-05, "loss": 1.4075, "step": 7851 }, { "epoch": 0.21, "learning_rate": 1.8268528040243318e-05, "loss": 1.2134, "step": 7852 }, { "epoch": 0.21, "learning_rate": 1.826803054479101e-05, "loss": 1.3184, "step": 7853 }, { "epoch": 0.21, "learning_rate": 1.8267532984653516e-05, "loss": 1.1788, "step": 7854 }, { "epoch": 0.21, "learning_rate": 1.826703535983473e-05, "loss": 1.3086, "step": 7855 }, { "epoch": 0.21, "learning_rate": 1.826653767033855e-05, "loss": 1.4463, "step": 7856 }, { "epoch": 0.21, "learning_rate": 1.826603991616887e-05, "loss": 1.4775, "step": 7857 }, { "epoch": 0.21, "learning_rate": 1.8265542097329572e-05, "loss": 1.3157, "step": 7858 }, { "epoch": 0.21, "learning_rate": 1.8265044213824566e-05, "loss": 1.2629, "step": 7859 }, { "epoch": 0.21, "learning_rate": 1.8264546265657735e-05, "loss": 1.2676, "step": 7860 }, { "epoch": 0.21, "learning_rate": 1.8264048252832983e-05, "loss": 1.3943, "step": 7861 }, { "epoch": 0.21, "learning_rate": 1.8263550175354206e-05, "loss": 1.4197, "step": 7862 }, { "epoch": 0.21, "learning_rate": 1.8263052033225298e-05, "loss": 1.3623, "step": 7863 }, { "epoch": 0.21, "learning_rate": 1.8262553826450157e-05, "loss": 1.4727, "step": 7864 }, { "epoch": 0.21, "learning_rate": 1.8262055555032673e-05, "loss": 1.5874, "step": 7865 }, { "epoch": 0.21, "learning_rate": 1.8261557218976757e-05, "loss": 1.5239, "step": 7866 }, { "epoch": 0.21, "learning_rate": 1.8261058818286305e-05, "loss": 1.3066, "step": 7867 }, { "epoch": 0.21, "learning_rate": 1.826056035296521e-05, "loss": 1.5066, "step": 7868 }, { "epoch": 0.21, "learning_rate": 1.8260061823017373e-05, "loss": 1.3733, "step": 7869 }, { "epoch": 0.21, "learning_rate": 1.82595632284467e-05, "loss": 1.5195, "step": 7870 }, { "epoch": 0.21, "learning_rate": 1.8259064569257085e-05, "loss": 1.2573, "step": 7871 }, { "epoch": 0.21, "learning_rate": 1.8258565845452434e-05, "loss": 1.3047, "step": 7872 }, { "epoch": 0.22, "learning_rate": 1.8258067057036648e-05, "loss": 1.2754, "step": 7873 }, { "epoch": 0.22, "learning_rate": 1.8257568204013627e-05, "loss": 1.3735, "step": 7874 }, { "epoch": 0.22, "learning_rate": 1.8257069286387278e-05, "loss": 1.4485, "step": 7875 }, { "epoch": 0.22, "learning_rate": 1.82565703041615e-05, "loss": 1.3501, "step": 7876 }, { "epoch": 0.22, "learning_rate": 1.82560712573402e-05, "loss": 1.4148, "step": 7877 }, { "epoch": 0.22, "learning_rate": 1.825557214592728e-05, "loss": 1.8569, "step": 7878 }, { "epoch": 0.22, "learning_rate": 1.8255072969926644e-05, "loss": 1.4563, "step": 7879 }, { "epoch": 0.22, "learning_rate": 1.82545737293422e-05, "loss": 1.832, "step": 7880 }, { "epoch": 0.22, "learning_rate": 1.825407442417785e-05, "loss": 1.5083, "step": 7881 }, { "epoch": 0.22, "learning_rate": 1.8253575054437506e-05, "loss": 1.3296, "step": 7882 }, { "epoch": 0.22, "learning_rate": 1.8253075620125074e-05, "loss": 1.4709, "step": 7883 }, { "epoch": 0.22, "learning_rate": 1.8252576121244455e-05, "loss": 1.2849, "step": 7884 }, { "epoch": 0.22, "learning_rate": 1.8252076557799563e-05, "loss": 1.4683, "step": 7885 }, { "epoch": 0.22, "learning_rate": 1.8251576929794305e-05, "loss": 1.4128, "step": 7886 }, { "epoch": 0.22, "learning_rate": 1.825107723723259e-05, "loss": 1.792, "step": 7887 }, { "epoch": 0.22, "learning_rate": 1.8250577480118324e-05, "loss": 1.3523, "step": 7888 }, { "epoch": 0.22, "learning_rate": 1.825007765845542e-05, "loss": 1.3838, "step": 7889 }, { "epoch": 0.22, "learning_rate": 1.8249577772247788e-05, "loss": 1.3896, "step": 7890 }, { "epoch": 0.22, "learning_rate": 1.824907782149934e-05, "loss": 1.4316, "step": 7891 }, { "epoch": 0.22, "learning_rate": 1.8248577806213986e-05, "loss": 1.2825, "step": 7892 }, { "epoch": 0.22, "learning_rate": 1.8248077726395634e-05, "loss": 1.3752, "step": 7893 }, { "epoch": 0.22, "learning_rate": 1.8247577582048205e-05, "loss": 1.293, "step": 7894 }, { "epoch": 0.22, "learning_rate": 1.8247077373175605e-05, "loss": 1.4331, "step": 7895 }, { "epoch": 0.22, "learning_rate": 1.824657709978175e-05, "loss": 1.1948, "step": 7896 }, { "epoch": 0.22, "learning_rate": 1.8246076761870556e-05, "loss": 1.3145, "step": 7897 }, { "epoch": 0.22, "learning_rate": 1.824557635944593e-05, "loss": 1.4751, "step": 7898 }, { "epoch": 0.22, "learning_rate": 1.8245075892511797e-05, "loss": 1.3342, "step": 7899 }, { "epoch": 0.22, "learning_rate": 1.8244575361072066e-05, "loss": 1.4224, "step": 7900 }, { "epoch": 0.22, "learning_rate": 1.8244074765130654e-05, "loss": 1.2993, "step": 7901 }, { "epoch": 0.22, "learning_rate": 1.8243574104691478e-05, "loss": 1.4619, "step": 7902 }, { "epoch": 0.22, "learning_rate": 1.8243073379758454e-05, "loss": 1.417, "step": 7903 }, { "epoch": 0.22, "learning_rate": 1.82425725903355e-05, "loss": 1.2627, "step": 7904 }, { "epoch": 0.22, "learning_rate": 1.824207173642653e-05, "loss": 1.4072, "step": 7905 }, { "epoch": 0.22, "learning_rate": 1.8241570818035472e-05, "loss": 1.5205, "step": 7906 }, { "epoch": 0.22, "learning_rate": 1.824106983516624e-05, "loss": 1.439, "step": 7907 }, { "epoch": 0.22, "learning_rate": 1.824056878782275e-05, "loss": 1.3757, "step": 7908 }, { "epoch": 0.22, "learning_rate": 1.8240067676008926e-05, "loss": 1.52, "step": 7909 }, { "epoch": 0.22, "learning_rate": 1.8239566499728684e-05, "loss": 1.2566, "step": 7910 }, { "epoch": 0.22, "learning_rate": 1.8239065258985952e-05, "loss": 1.2336, "step": 7911 }, { "epoch": 0.22, "learning_rate": 1.8238563953784646e-05, "loss": 1.2593, "step": 7912 }, { "epoch": 0.22, "learning_rate": 1.8238062584128693e-05, "loss": 1.9087, "step": 7913 }, { "epoch": 0.22, "learning_rate": 1.8237561150022006e-05, "loss": 1.3152, "step": 7914 }, { "epoch": 0.22, "learning_rate": 1.823705965146852e-05, "loss": 1.3252, "step": 7915 }, { "epoch": 0.22, "learning_rate": 1.823655808847215e-05, "loss": 1.4272, "step": 7916 }, { "epoch": 0.22, "learning_rate": 1.8236056461036824e-05, "loss": 1.3916, "step": 7917 }, { "epoch": 0.22, "learning_rate": 1.823555476916646e-05, "loss": 1.1626, "step": 7918 }, { "epoch": 0.22, "learning_rate": 1.8235053012864993e-05, "loss": 1.3931, "step": 7919 }, { "epoch": 0.22, "learning_rate": 1.823455119213634e-05, "loss": 1.436, "step": 7920 }, { "epoch": 0.22, "learning_rate": 1.8234049306984438e-05, "loss": 1.2578, "step": 7921 }, { "epoch": 0.22, "learning_rate": 1.8233547357413202e-05, "loss": 1.4246, "step": 7922 }, { "epoch": 0.22, "learning_rate": 1.8233045343426564e-05, "loss": 1.3257, "step": 7923 }, { "epoch": 0.22, "learning_rate": 1.8232543265028447e-05, "loss": 1.438, "step": 7924 }, { "epoch": 0.22, "learning_rate": 1.8232041122222785e-05, "loss": 1.27, "step": 7925 }, { "epoch": 0.22, "learning_rate": 1.82315389150135e-05, "loss": 1.4033, "step": 7926 }, { "epoch": 0.22, "learning_rate": 1.8231036643404533e-05, "loss": 1.3357, "step": 7927 }, { "epoch": 0.22, "learning_rate": 1.82305343073998e-05, "loss": 1.2712, "step": 7928 }, { "epoch": 0.22, "learning_rate": 1.823003190700324e-05, "loss": 1.3813, "step": 7929 }, { "epoch": 0.22, "learning_rate": 1.822952944221878e-05, "loss": 1.3052, "step": 7930 }, { "epoch": 0.22, "learning_rate": 1.8229026913050352e-05, "loss": 1.3464, "step": 7931 }, { "epoch": 0.22, "learning_rate": 1.8228524319501887e-05, "loss": 1.3569, "step": 7932 }, { "epoch": 0.22, "learning_rate": 1.8228021661577316e-05, "loss": 1.4194, "step": 7933 }, { "epoch": 0.22, "learning_rate": 1.8227518939280572e-05, "loss": 1.6309, "step": 7934 }, { "epoch": 0.22, "learning_rate": 1.8227016152615588e-05, "loss": 1.3618, "step": 7935 }, { "epoch": 0.22, "learning_rate": 1.82265133015863e-05, "loss": 1.291, "step": 7936 }, { "epoch": 0.22, "learning_rate": 1.822601038619664e-05, "loss": 1.2751, "step": 7937 }, { "epoch": 0.22, "learning_rate": 1.8225507406450545e-05, "loss": 1.7466, "step": 7938 }, { "epoch": 0.22, "learning_rate": 1.8225004362351943e-05, "loss": 1.3691, "step": 7939 }, { "epoch": 0.22, "learning_rate": 1.8224501253904778e-05, "loss": 1.3945, "step": 7940 }, { "epoch": 0.22, "learning_rate": 1.822399808111298e-05, "loss": 1.3875, "step": 7941 }, { "epoch": 0.22, "learning_rate": 1.822349484398049e-05, "loss": 1.3149, "step": 7942 }, { "epoch": 0.22, "learning_rate": 1.8222991542511247e-05, "loss": 1.3765, "step": 7943 }, { "epoch": 0.22, "learning_rate": 1.822248817670918e-05, "loss": 1.4744, "step": 7944 }, { "epoch": 0.22, "learning_rate": 1.822198474657823e-05, "loss": 1.3467, "step": 7945 }, { "epoch": 0.22, "learning_rate": 1.8221481252122345e-05, "loss": 1.3682, "step": 7946 }, { "epoch": 0.22, "learning_rate": 1.822097769334545e-05, "loss": 1.2769, "step": 7947 }, { "epoch": 0.22, "learning_rate": 1.822047407025149e-05, "loss": 1.1396, "step": 7948 }, { "epoch": 0.22, "learning_rate": 1.8219970382844414e-05, "loss": 1.3286, "step": 7949 }, { "epoch": 0.22, "learning_rate": 1.821946663112815e-05, "loss": 1.2781, "step": 7950 }, { "epoch": 0.22, "learning_rate": 1.8218962815106648e-05, "loss": 1.5232, "step": 7951 }, { "epoch": 0.22, "learning_rate": 1.821845893478384e-05, "loss": 1.4966, "step": 7952 }, { "epoch": 0.22, "learning_rate": 1.821795499016368e-05, "loss": 1.3965, "step": 7953 }, { "epoch": 0.22, "learning_rate": 1.82174509812501e-05, "loss": 1.4758, "step": 7954 }, { "epoch": 0.22, "learning_rate": 1.8216946908047052e-05, "loss": 1.2556, "step": 7955 }, { "epoch": 0.22, "learning_rate": 1.8216442770558468e-05, "loss": 1.4722, "step": 7956 }, { "epoch": 0.22, "learning_rate": 1.8215938568788306e-05, "loss": 1.4578, "step": 7957 }, { "epoch": 0.22, "learning_rate": 1.8215434302740504e-05, "loss": 1.2854, "step": 7958 }, { "epoch": 0.22, "learning_rate": 1.8214929972419004e-05, "loss": 1.3589, "step": 7959 }, { "epoch": 0.22, "learning_rate": 1.8214425577827755e-05, "loss": 1.4692, "step": 7960 }, { "epoch": 0.22, "learning_rate": 1.8213921118970703e-05, "loss": 1.3367, "step": 7961 }, { "epoch": 0.22, "learning_rate": 1.8213416595851796e-05, "loss": 1.3462, "step": 7962 }, { "epoch": 0.22, "learning_rate": 1.8212912008474977e-05, "loss": 1.1594, "step": 7963 }, { "epoch": 0.22, "learning_rate": 1.82124073568442e-05, "loss": 1.3408, "step": 7964 }, { "epoch": 0.22, "learning_rate": 1.821190264096341e-05, "loss": 1.2908, "step": 7965 }, { "epoch": 0.22, "learning_rate": 1.8211397860836554e-05, "loss": 1.4707, "step": 7966 }, { "epoch": 0.22, "learning_rate": 1.821089301646758e-05, "loss": 1.2371, "step": 7967 }, { "epoch": 0.22, "learning_rate": 1.8210388107860445e-05, "loss": 1.2881, "step": 7968 }, { "epoch": 0.22, "learning_rate": 1.8209883135019088e-05, "loss": 1.3718, "step": 7969 }, { "epoch": 0.22, "learning_rate": 1.820937809794747e-05, "loss": 1.3416, "step": 7970 }, { "epoch": 0.22, "learning_rate": 1.8208872996649538e-05, "loss": 1.3098, "step": 7971 }, { "epoch": 0.22, "learning_rate": 1.8208367831129243e-05, "loss": 1.283, "step": 7972 }, { "epoch": 0.22, "learning_rate": 1.8207862601390538e-05, "loss": 1.3213, "step": 7973 }, { "epoch": 0.22, "learning_rate": 1.8207357307437378e-05, "loss": 1.2373, "step": 7974 }, { "epoch": 0.22, "learning_rate": 1.820685194927371e-05, "loss": 1.3809, "step": 7975 }, { "epoch": 0.22, "learning_rate": 1.820634652690349e-05, "loss": 1.4001, "step": 7976 }, { "epoch": 0.22, "learning_rate": 1.8205841040330677e-05, "loss": 1.3188, "step": 7977 }, { "epoch": 0.22, "learning_rate": 1.8205335489559225e-05, "loss": 1.2063, "step": 7978 }, { "epoch": 0.22, "learning_rate": 1.8204829874593083e-05, "loss": 1.4607, "step": 7979 }, { "epoch": 0.22, "learning_rate": 1.820432419543621e-05, "loss": 1.374, "step": 7980 }, { "epoch": 0.22, "learning_rate": 1.8203818452092563e-05, "loss": 1.4482, "step": 7981 }, { "epoch": 0.22, "learning_rate": 1.8203312644566095e-05, "loss": 1.4648, "step": 7982 }, { "epoch": 0.22, "learning_rate": 1.820280677286077e-05, "loss": 1.2915, "step": 7983 }, { "epoch": 0.22, "learning_rate": 1.8202300836980543e-05, "loss": 1.3733, "step": 7984 }, { "epoch": 0.22, "learning_rate": 1.8201794836929368e-05, "loss": 1.3735, "step": 7985 }, { "epoch": 0.22, "learning_rate": 1.8201288772711212e-05, "loss": 1.3833, "step": 7986 }, { "epoch": 0.22, "learning_rate": 1.8200782644330022e-05, "loss": 1.4233, "step": 7987 }, { "epoch": 0.22, "learning_rate": 1.820027645178977e-05, "loss": 1.5659, "step": 7988 }, { "epoch": 0.22, "learning_rate": 1.819977019509441e-05, "loss": 1.3452, "step": 7989 }, { "epoch": 0.22, "learning_rate": 1.8199263874247905e-05, "loss": 1.4282, "step": 7990 }, { "epoch": 0.22, "learning_rate": 1.8198757489254214e-05, "loss": 1.3711, "step": 7991 }, { "epoch": 0.22, "learning_rate": 1.8198251040117297e-05, "loss": 1.3398, "step": 7992 }, { "epoch": 0.22, "learning_rate": 1.8197744526841124e-05, "loss": 1.4526, "step": 7993 }, { "epoch": 0.22, "learning_rate": 1.8197237949429653e-05, "loss": 1.3342, "step": 7994 }, { "epoch": 0.22, "learning_rate": 1.819673130788684e-05, "loss": 1.1106, "step": 7995 }, { "epoch": 0.22, "learning_rate": 1.819622460221666e-05, "loss": 1.3396, "step": 7996 }, { "epoch": 0.22, "learning_rate": 1.8195717832423075e-05, "loss": 1.2832, "step": 7997 }, { "epoch": 0.22, "learning_rate": 1.8195210998510044e-05, "loss": 1.457, "step": 7998 }, { "epoch": 0.22, "learning_rate": 1.8194704100481538e-05, "loss": 1.4229, "step": 7999 }, { "epoch": 0.22, "learning_rate": 1.819419713834152e-05, "loss": 1.3704, "step": 8000 }, { "epoch": 0.22, "learning_rate": 1.8193690112093953e-05, "loss": 1.3877, "step": 8001 }, { "epoch": 0.22, "learning_rate": 1.819318302174281e-05, "loss": 1.3425, "step": 8002 }, { "epoch": 0.22, "learning_rate": 1.819267586729206e-05, "loss": 1.3501, "step": 8003 }, { "epoch": 0.22, "learning_rate": 1.819216864874566e-05, "loss": 1.3198, "step": 8004 }, { "epoch": 0.22, "learning_rate": 1.819166136610759e-05, "loss": 1.4714, "step": 8005 }, { "epoch": 0.22, "learning_rate": 1.819115401938181e-05, "loss": 1.5146, "step": 8006 }, { "epoch": 0.22, "learning_rate": 1.8190646608572292e-05, "loss": 1.3176, "step": 8007 }, { "epoch": 0.22, "learning_rate": 1.819013913368301e-05, "loss": 1.3848, "step": 8008 }, { "epoch": 0.22, "learning_rate": 1.818963159471793e-05, "loss": 1.4438, "step": 8009 }, { "epoch": 0.22, "learning_rate": 1.818912399168102e-05, "loss": 1.4316, "step": 8010 }, { "epoch": 0.22, "learning_rate": 1.8188616324576257e-05, "loss": 1.3562, "step": 8011 }, { "epoch": 0.22, "learning_rate": 1.8188108593407608e-05, "loss": 1.2598, "step": 8012 }, { "epoch": 0.22, "learning_rate": 1.8187600798179053e-05, "loss": 1.4131, "step": 8013 }, { "epoch": 0.22, "learning_rate": 1.8187092938894557e-05, "loss": 1.2769, "step": 8014 }, { "epoch": 0.22, "learning_rate": 1.8186585015558096e-05, "loss": 1.2649, "step": 8015 }, { "epoch": 0.22, "learning_rate": 1.818607702817364e-05, "loss": 1.3848, "step": 8016 }, { "epoch": 0.22, "learning_rate": 1.818556897674517e-05, "loss": 1.3833, "step": 8017 }, { "epoch": 0.22, "learning_rate": 1.8185060861276657e-05, "loss": 1.219, "step": 8018 }, { "epoch": 0.22, "learning_rate": 1.818455268177208e-05, "loss": 1.2395, "step": 8019 }, { "epoch": 0.22, "learning_rate": 1.8184044438235404e-05, "loss": 1.1353, "step": 8020 }, { "epoch": 0.22, "learning_rate": 1.818353613067062e-05, "loss": 1.4194, "step": 8021 }, { "epoch": 0.22, "learning_rate": 1.818302775908169e-05, "loss": 1.4353, "step": 8022 }, { "epoch": 0.22, "learning_rate": 1.8182519323472605e-05, "loss": 1.4268, "step": 8023 }, { "epoch": 0.22, "learning_rate": 1.8182010823847335e-05, "loss": 1.4336, "step": 8024 }, { "epoch": 0.22, "learning_rate": 1.8181502260209857e-05, "loss": 1.3262, "step": 8025 }, { "epoch": 0.22, "learning_rate": 1.8180993632564156e-05, "loss": 1.4624, "step": 8026 }, { "epoch": 0.22, "learning_rate": 1.8180484940914206e-05, "loss": 1.3103, "step": 8027 }, { "epoch": 0.22, "learning_rate": 1.817997618526399e-05, "loss": 1.3689, "step": 8028 }, { "epoch": 0.22, "learning_rate": 1.8179467365617486e-05, "loss": 1.3213, "step": 8029 }, { "epoch": 0.22, "learning_rate": 1.8178958481978676e-05, "loss": 1.3462, "step": 8030 }, { "epoch": 0.22, "learning_rate": 1.817844953435154e-05, "loss": 1.4399, "step": 8031 }, { "epoch": 0.22, "learning_rate": 1.817794052274006e-05, "loss": 1.4082, "step": 8032 }, { "epoch": 0.22, "learning_rate": 1.8177431447148223e-05, "loss": 1.333, "step": 8033 }, { "epoch": 0.22, "learning_rate": 1.8176922307580003e-05, "loss": 1.3333, "step": 8034 }, { "epoch": 0.22, "learning_rate": 1.817641310403939e-05, "loss": 1.2869, "step": 8035 }, { "epoch": 0.22, "learning_rate": 1.8175903836530364e-05, "loss": 1.3733, "step": 8036 }, { "epoch": 0.22, "learning_rate": 1.8175394505056913e-05, "loss": 1.5112, "step": 8037 }, { "epoch": 0.22, "learning_rate": 1.817488510962302e-05, "loss": 1.2646, "step": 8038 }, { "epoch": 0.22, "learning_rate": 1.8174375650232667e-05, "loss": 1.3987, "step": 8039 }, { "epoch": 0.22, "learning_rate": 1.8173866126889844e-05, "loss": 1.2285, "step": 8040 }, { "epoch": 0.22, "learning_rate": 1.817335653959854e-05, "loss": 1.2537, "step": 8041 }, { "epoch": 0.22, "learning_rate": 1.8172846888362733e-05, "loss": 1.2422, "step": 8042 }, { "epoch": 0.22, "learning_rate": 1.8172337173186416e-05, "loss": 1.3618, "step": 8043 }, { "epoch": 0.22, "learning_rate": 1.8171827394073576e-05, "loss": 1.3223, "step": 8044 }, { "epoch": 0.22, "learning_rate": 1.8171317551028203e-05, "loss": 1.8696, "step": 8045 }, { "epoch": 0.22, "learning_rate": 1.8170807644054283e-05, "loss": 1.3235, "step": 8046 }, { "epoch": 0.22, "learning_rate": 1.8170297673155802e-05, "loss": 1.3408, "step": 8047 }, { "epoch": 0.22, "learning_rate": 1.816978763833676e-05, "loss": 1.4126, "step": 8048 }, { "epoch": 0.22, "learning_rate": 1.816927753960114e-05, "loss": 1.1169, "step": 8049 }, { "epoch": 0.22, "learning_rate": 1.8168767376952932e-05, "loss": 1.4019, "step": 8050 }, { "epoch": 0.22, "learning_rate": 1.816825715039613e-05, "loss": 1.4463, "step": 8051 }, { "epoch": 0.22, "learning_rate": 1.8167746859934724e-05, "loss": 1.3418, "step": 8052 }, { "epoch": 0.22, "learning_rate": 1.816723650557271e-05, "loss": 1.3621, "step": 8053 }, { "epoch": 0.22, "learning_rate": 1.8166726087314075e-05, "loss": 1.3567, "step": 8054 }, { "epoch": 0.22, "learning_rate": 1.8166215605162815e-05, "loss": 1.4785, "step": 8055 }, { "epoch": 0.22, "learning_rate": 1.8165705059122925e-05, "loss": 1.2429, "step": 8056 }, { "epoch": 0.22, "learning_rate": 1.81651944491984e-05, "loss": 1.2908, "step": 8057 }, { "epoch": 0.22, "learning_rate": 1.8164683775393234e-05, "loss": 1.3977, "step": 8058 }, { "epoch": 0.22, "learning_rate": 1.8164173037711422e-05, "loss": 1.2969, "step": 8059 }, { "epoch": 0.22, "learning_rate": 1.8163662236156956e-05, "loss": 1.4341, "step": 8060 }, { "epoch": 0.22, "learning_rate": 1.8163151370733838e-05, "loss": 1.3862, "step": 8061 }, { "epoch": 0.22, "learning_rate": 1.816264044144606e-05, "loss": 1.4353, "step": 8062 }, { "epoch": 0.22, "learning_rate": 1.816212944829762e-05, "loss": 1.1978, "step": 8063 }, { "epoch": 0.22, "learning_rate": 1.8161618391292523e-05, "loss": 1.4182, "step": 8064 }, { "epoch": 0.22, "learning_rate": 1.8161107270434757e-05, "loss": 1.3928, "step": 8065 }, { "epoch": 0.22, "learning_rate": 1.816059608572833e-05, "loss": 1.4849, "step": 8066 }, { "epoch": 0.22, "learning_rate": 1.816008483717723e-05, "loss": 1.3696, "step": 8067 }, { "epoch": 0.22, "learning_rate": 1.8159573524785467e-05, "loss": 1.2429, "step": 8068 }, { "epoch": 0.22, "learning_rate": 1.815906214855704e-05, "loss": 1.3982, "step": 8069 }, { "epoch": 0.22, "learning_rate": 1.8158550708495944e-05, "loss": 1.2998, "step": 8070 }, { "epoch": 0.22, "learning_rate": 1.8158039204606183e-05, "loss": 1.4985, "step": 8071 }, { "epoch": 0.22, "learning_rate": 1.815752763689176e-05, "loss": 1.2717, "step": 8072 }, { "epoch": 0.22, "learning_rate": 1.8157016005356677e-05, "loss": 1.2637, "step": 8073 }, { "epoch": 0.22, "learning_rate": 1.815650431000494e-05, "loss": 1.2275, "step": 8074 }, { "epoch": 0.22, "learning_rate": 1.8155992550840544e-05, "loss": 1.2678, "step": 8075 }, { "epoch": 0.22, "learning_rate": 1.8155480727867498e-05, "loss": 1.4099, "step": 8076 }, { "epoch": 0.22, "learning_rate": 1.815496884108981e-05, "loss": 1.3596, "step": 8077 }, { "epoch": 0.22, "learning_rate": 1.8154456890511477e-05, "loss": 1.3789, "step": 8078 }, { "epoch": 0.22, "learning_rate": 1.8153944876136508e-05, "loss": 1.4224, "step": 8079 }, { "epoch": 0.22, "learning_rate": 1.8153432797968908e-05, "loss": 1.3438, "step": 8080 }, { "epoch": 0.22, "learning_rate": 1.8152920656012684e-05, "loss": 1.4055, "step": 8081 }, { "epoch": 0.22, "learning_rate": 1.8152408450271847e-05, "loss": 1.4836, "step": 8082 }, { "epoch": 0.22, "learning_rate": 1.8151896180750394e-05, "loss": 1.479, "step": 8083 }, { "epoch": 0.22, "learning_rate": 1.815138384745234e-05, "loss": 1.3315, "step": 8084 }, { "epoch": 0.22, "learning_rate": 1.8150871450381692e-05, "loss": 1.366, "step": 8085 }, { "epoch": 0.22, "learning_rate": 1.815035898954246e-05, "loss": 1.3931, "step": 8086 }, { "epoch": 0.22, "learning_rate": 1.814984646493865e-05, "loss": 1.3896, "step": 8087 }, { "epoch": 0.22, "learning_rate": 1.8149333876574274e-05, "loss": 1.2561, "step": 8088 }, { "epoch": 0.22, "learning_rate": 1.8148821224453342e-05, "loss": 1.3894, "step": 8089 }, { "epoch": 0.22, "learning_rate": 1.8148308508579868e-05, "loss": 1.5713, "step": 8090 }, { "epoch": 0.22, "learning_rate": 1.8147795728957854e-05, "loss": 1.4324, "step": 8091 }, { "epoch": 0.22, "learning_rate": 1.8147282885591323e-05, "loss": 1.3093, "step": 8092 }, { "epoch": 0.22, "learning_rate": 1.814676997848428e-05, "loss": 1.8232, "step": 8093 }, { "epoch": 0.22, "learning_rate": 1.8146257007640737e-05, "loss": 1.4355, "step": 8094 }, { "epoch": 0.22, "learning_rate": 1.8145743973064713e-05, "loss": 1.3425, "step": 8095 }, { "epoch": 0.22, "learning_rate": 1.8145230874760214e-05, "loss": 1.3999, "step": 8096 }, { "epoch": 0.22, "learning_rate": 1.8144717712731265e-05, "loss": 1.2917, "step": 8097 }, { "epoch": 0.22, "learning_rate": 1.814420448698187e-05, "loss": 1.2795, "step": 8098 }, { "epoch": 0.22, "learning_rate": 1.8143691197516048e-05, "loss": 1.407, "step": 8099 }, { "epoch": 0.22, "learning_rate": 1.814317784433782e-05, "loss": 1.4377, "step": 8100 }, { "epoch": 0.22, "learning_rate": 1.8142664427451196e-05, "loss": 1.4717, "step": 8101 }, { "epoch": 0.22, "learning_rate": 1.8142150946860192e-05, "loss": 1.4021, "step": 8102 }, { "epoch": 0.22, "learning_rate": 1.814163740256883e-05, "loss": 1.248, "step": 8103 }, { "epoch": 0.22, "learning_rate": 1.8141123794581124e-05, "loss": 1.4199, "step": 8104 }, { "epoch": 0.22, "learning_rate": 1.8140610122901097e-05, "loss": 1.4092, "step": 8105 }, { "epoch": 0.22, "learning_rate": 1.814009638753276e-05, "loss": 1.3887, "step": 8106 }, { "epoch": 0.22, "learning_rate": 1.813958258848014e-05, "loss": 1.3838, "step": 8107 }, { "epoch": 0.22, "learning_rate": 1.8139068725747255e-05, "loss": 1.5811, "step": 8108 }, { "epoch": 0.22, "learning_rate": 1.8138554799338118e-05, "loss": 1.5547, "step": 8109 }, { "epoch": 0.22, "learning_rate": 1.813804080925676e-05, "loss": 1.4309, "step": 8110 }, { "epoch": 0.22, "learning_rate": 1.8137526755507193e-05, "loss": 1.3967, "step": 8111 }, { "epoch": 0.22, "learning_rate": 1.813701263809345e-05, "loss": 1.3674, "step": 8112 }, { "epoch": 0.22, "learning_rate": 1.8136498457019537e-05, "loss": 1.4067, "step": 8113 }, { "epoch": 0.22, "learning_rate": 1.813598421228949e-05, "loss": 1.4937, "step": 8114 }, { "epoch": 0.22, "learning_rate": 1.813546990390733e-05, "loss": 1.3376, "step": 8115 }, { "epoch": 0.22, "learning_rate": 1.813495553187708e-05, "loss": 1.3354, "step": 8116 }, { "epoch": 0.22, "learning_rate": 1.8134441096202762e-05, "loss": 1.3076, "step": 8117 }, { "epoch": 0.22, "learning_rate": 1.81339265968884e-05, "loss": 1.4951, "step": 8118 }, { "epoch": 0.22, "learning_rate": 1.8133412033938023e-05, "loss": 1.4221, "step": 8119 }, { "epoch": 0.22, "learning_rate": 1.8132897407355657e-05, "loss": 1.4463, "step": 8120 }, { "epoch": 0.22, "learning_rate": 1.813238271714532e-05, "loss": 1.333, "step": 8121 }, { "epoch": 0.22, "learning_rate": 1.813186796331105e-05, "loss": 1.4402, "step": 8122 }, { "epoch": 0.22, "learning_rate": 1.8131353145856866e-05, "loss": 1.3992, "step": 8123 }, { "epoch": 0.22, "learning_rate": 1.8130838264786802e-05, "loss": 1.3268, "step": 8124 }, { "epoch": 0.22, "learning_rate": 1.813032332010488e-05, "loss": 1.4016, "step": 8125 }, { "epoch": 0.22, "learning_rate": 1.812980831181513e-05, "loss": 1.3145, "step": 8126 }, { "epoch": 0.22, "learning_rate": 1.8129293239921584e-05, "loss": 1.2415, "step": 8127 }, { "epoch": 0.22, "learning_rate": 1.8128778104428274e-05, "loss": 1.2056, "step": 8128 }, { "epoch": 0.22, "learning_rate": 1.8128262905339226e-05, "loss": 1.426, "step": 8129 }, { "epoch": 0.22, "learning_rate": 1.8127747642658467e-05, "loss": 1.4568, "step": 8130 }, { "epoch": 0.22, "learning_rate": 1.8127232316390034e-05, "loss": 1.2336, "step": 8131 }, { "epoch": 0.22, "learning_rate": 1.8126716926537958e-05, "loss": 1.3486, "step": 8132 }, { "epoch": 0.22, "learning_rate": 1.8126201473106267e-05, "loss": 1.5378, "step": 8133 }, { "epoch": 0.22, "learning_rate": 1.8125685956099e-05, "loss": 1.417, "step": 8134 }, { "epoch": 0.22, "learning_rate": 1.8125170375520187e-05, "loss": 1.4263, "step": 8135 }, { "epoch": 0.22, "learning_rate": 1.812465473137386e-05, "loss": 1.4568, "step": 8136 }, { "epoch": 0.22, "learning_rate": 1.812413902366406e-05, "loss": 1.3391, "step": 8137 }, { "epoch": 0.22, "learning_rate": 1.8123623252394812e-05, "loss": 1.3704, "step": 8138 }, { "epoch": 0.22, "learning_rate": 1.8123107417570155e-05, "loss": 1.4067, "step": 8139 }, { "epoch": 0.22, "learning_rate": 1.8122591519194127e-05, "loss": 1.4277, "step": 8140 }, { "epoch": 0.22, "learning_rate": 1.8122075557270764e-05, "loss": 1.4304, "step": 8141 }, { "epoch": 0.22, "learning_rate": 1.8121559531804097e-05, "loss": 1.2842, "step": 8142 }, { "epoch": 0.22, "learning_rate": 1.8121043442798168e-05, "loss": 1.3972, "step": 8143 }, { "epoch": 0.22, "learning_rate": 1.8120527290257016e-05, "loss": 1.2664, "step": 8144 }, { "epoch": 0.22, "learning_rate": 1.8120011074184676e-05, "loss": 1.4688, "step": 8145 }, { "epoch": 0.22, "learning_rate": 1.811949479458519e-05, "loss": 1.4614, "step": 8146 }, { "epoch": 0.22, "learning_rate": 1.8118978451462595e-05, "loss": 1.219, "step": 8147 }, { "epoch": 0.22, "learning_rate": 1.8118462044820927e-05, "loss": 1.342, "step": 8148 }, { "epoch": 0.22, "learning_rate": 1.811794557466423e-05, "loss": 1.3284, "step": 8149 }, { "epoch": 0.22, "learning_rate": 1.8117429040996547e-05, "loss": 1.4629, "step": 8150 }, { "epoch": 0.22, "learning_rate": 1.8116912443821912e-05, "loss": 1.3484, "step": 8151 }, { "epoch": 0.22, "learning_rate": 1.8116395783144374e-05, "loss": 1.5032, "step": 8152 }, { "epoch": 0.22, "learning_rate": 1.811587905896797e-05, "loss": 1.3977, "step": 8153 }, { "epoch": 0.22, "learning_rate": 1.8115362271296747e-05, "loss": 1.3403, "step": 8154 }, { "epoch": 0.22, "learning_rate": 1.8114845420134743e-05, "loss": 1.2998, "step": 8155 }, { "epoch": 0.22, "learning_rate": 1.8114328505486004e-05, "loss": 1.2412, "step": 8156 }, { "epoch": 0.22, "learning_rate": 1.8113811527354577e-05, "loss": 1.4612, "step": 8157 }, { "epoch": 0.22, "learning_rate": 1.8113294485744503e-05, "loss": 1.4321, "step": 8158 }, { "epoch": 0.22, "learning_rate": 1.8112777380659826e-05, "loss": 1.481, "step": 8159 }, { "epoch": 0.22, "learning_rate": 1.81122602121046e-05, "loss": 1.3591, "step": 8160 }, { "epoch": 0.22, "learning_rate": 1.811174298008286e-05, "loss": 1.3862, "step": 8161 }, { "epoch": 0.22, "learning_rate": 1.8111225684598657e-05, "loss": 1.3755, "step": 8162 }, { "epoch": 0.22, "learning_rate": 1.8110708325656038e-05, "loss": 1.3862, "step": 8163 }, { "epoch": 0.22, "learning_rate": 1.8110190903259053e-05, "loss": 1.4148, "step": 8164 }, { "epoch": 0.22, "learning_rate": 1.8109673417411748e-05, "loss": 1.4429, "step": 8165 }, { "epoch": 0.22, "learning_rate": 1.8109155868118172e-05, "loss": 1.3271, "step": 8166 }, { "epoch": 0.22, "learning_rate": 1.810863825538237e-05, "loss": 1.2891, "step": 8167 }, { "epoch": 0.22, "learning_rate": 1.81081205792084e-05, "loss": 1.4548, "step": 8168 }, { "epoch": 0.22, "learning_rate": 1.8107602839600306e-05, "loss": 1.3879, "step": 8169 }, { "epoch": 0.22, "learning_rate": 1.8107085036562137e-05, "loss": 1.3542, "step": 8170 }, { "epoch": 0.22, "learning_rate": 1.8106567170097948e-05, "loss": 1.4138, "step": 8171 }, { "epoch": 0.22, "learning_rate": 1.810604924021179e-05, "loss": 1.3831, "step": 8172 }, { "epoch": 0.22, "learning_rate": 1.810553124690772e-05, "loss": 1.3369, "step": 8173 }, { "epoch": 0.22, "learning_rate": 1.8105013190189775e-05, "loss": 1.4539, "step": 8174 }, { "epoch": 0.22, "learning_rate": 1.8104495070062024e-05, "loss": 1.396, "step": 8175 }, { "epoch": 0.22, "learning_rate": 1.8103976886528514e-05, "loss": 1.5, "step": 8176 }, { "epoch": 0.22, "learning_rate": 1.81034586395933e-05, "loss": 1.2563, "step": 8177 }, { "epoch": 0.22, "learning_rate": 1.810294032926043e-05, "loss": 1.5276, "step": 8178 }, { "epoch": 0.22, "learning_rate": 1.8102421955533974e-05, "loss": 1.4111, "step": 8179 }, { "epoch": 0.22, "learning_rate": 1.8101903518417972e-05, "loss": 1.4436, "step": 8180 }, { "epoch": 0.22, "learning_rate": 1.810138501791649e-05, "loss": 1.3108, "step": 8181 }, { "epoch": 0.22, "learning_rate": 1.8100866454033582e-05, "loss": 1.28, "step": 8182 }, { "epoch": 0.22, "learning_rate": 1.8100347826773304e-05, "loss": 1.3489, "step": 8183 }, { "epoch": 0.22, "learning_rate": 1.809982913613971e-05, "loss": 1.3228, "step": 8184 }, { "epoch": 0.22, "learning_rate": 1.8099310382136866e-05, "loss": 1.3733, "step": 8185 }, { "epoch": 0.22, "learning_rate": 1.8098791564768825e-05, "loss": 1.4414, "step": 8186 }, { "epoch": 0.22, "learning_rate": 1.8098272684039647e-05, "loss": 1.2263, "step": 8187 }, { "epoch": 0.22, "learning_rate": 1.809775373995339e-05, "loss": 1.3069, "step": 8188 }, { "epoch": 0.22, "learning_rate": 1.8097234732514116e-05, "loss": 1.3052, "step": 8189 }, { "epoch": 0.22, "learning_rate": 1.809671566172589e-05, "loss": 1.3118, "step": 8190 }, { "epoch": 0.22, "learning_rate": 1.809619652759276e-05, "loss": 1.2322, "step": 8191 }, { "epoch": 0.22, "learning_rate": 1.80956773301188e-05, "loss": 1.2976, "step": 8192 }, { "epoch": 0.22, "learning_rate": 1.8095158069308065e-05, "loss": 1.3423, "step": 8193 }, { "epoch": 0.22, "learning_rate": 1.809463874516462e-05, "loss": 1.5308, "step": 8194 }, { "epoch": 0.22, "learning_rate": 1.8094119357692532e-05, "loss": 1.4675, "step": 8195 }, { "epoch": 0.22, "learning_rate": 1.809359990689586e-05, "loss": 1.4255, "step": 8196 }, { "epoch": 0.22, "learning_rate": 1.809308039277866e-05, "loss": 1.3877, "step": 8197 }, { "epoch": 0.22, "learning_rate": 1.8092560815345012e-05, "loss": 1.4121, "step": 8198 }, { "epoch": 0.22, "learning_rate": 1.8092041174598974e-05, "loss": 1.4417, "step": 8199 }, { "epoch": 0.22, "learning_rate": 1.809152147054461e-05, "loss": 1.3594, "step": 8200 }, { "epoch": 0.22, "learning_rate": 1.8091001703185983e-05, "loss": 1.3789, "step": 8201 }, { "epoch": 0.22, "learning_rate": 1.809048187252717e-05, "loss": 1.3242, "step": 8202 }, { "epoch": 0.22, "learning_rate": 1.8089961978572222e-05, "loss": 1.3521, "step": 8203 }, { "epoch": 0.22, "learning_rate": 1.808944202132522e-05, "loss": 1.3337, "step": 8204 }, { "epoch": 0.22, "learning_rate": 1.8088922000790233e-05, "loss": 1.2629, "step": 8205 }, { "epoch": 0.22, "learning_rate": 1.808840191697132e-05, "loss": 1.2432, "step": 8206 }, { "epoch": 0.22, "learning_rate": 1.808788176987255e-05, "loss": 1.3813, "step": 8207 }, { "epoch": 0.22, "learning_rate": 1.8087361559498e-05, "loss": 1.3735, "step": 8208 }, { "epoch": 0.22, "learning_rate": 1.8086841285851736e-05, "loss": 1.4517, "step": 8209 }, { "epoch": 0.22, "learning_rate": 1.808632094893783e-05, "loss": 1.311, "step": 8210 }, { "epoch": 0.22, "learning_rate": 1.808580054876035e-05, "loss": 1.4878, "step": 8211 }, { "epoch": 0.22, "learning_rate": 1.8085280085323367e-05, "loss": 1.5051, "step": 8212 }, { "epoch": 0.22, "learning_rate": 1.8084759558630956e-05, "loss": 1.4526, "step": 8213 }, { "epoch": 0.22, "learning_rate": 1.808423896868719e-05, "loss": 1.187, "step": 8214 }, { "epoch": 0.22, "learning_rate": 1.8083718315496134e-05, "loss": 1.4111, "step": 8215 }, { "epoch": 0.22, "learning_rate": 1.8083197599061872e-05, "loss": 1.4341, "step": 8216 }, { "epoch": 0.22, "learning_rate": 1.8082676819388472e-05, "loss": 1.3513, "step": 8217 }, { "epoch": 0.22, "learning_rate": 1.8082155976480007e-05, "loss": 1.3149, "step": 8218 }, { "epoch": 0.22, "learning_rate": 1.808163507034056e-05, "loss": 1.3225, "step": 8219 }, { "epoch": 0.22, "learning_rate": 1.8081114100974195e-05, "loss": 1.3965, "step": 8220 }, { "epoch": 0.22, "learning_rate": 1.8080593068384993e-05, "loss": 1.2925, "step": 8221 }, { "epoch": 0.22, "learning_rate": 1.808007197257703e-05, "loss": 1.3628, "step": 8222 }, { "epoch": 0.22, "learning_rate": 1.807955081355439e-05, "loss": 1.3777, "step": 8223 }, { "epoch": 0.22, "learning_rate": 1.8079029591321138e-05, "loss": 1.2485, "step": 8224 }, { "epoch": 0.22, "learning_rate": 1.807850830588136e-05, "loss": 1.374, "step": 8225 }, { "epoch": 0.22, "learning_rate": 1.807798695723913e-05, "loss": 1.4004, "step": 8226 }, { "epoch": 0.22, "learning_rate": 1.807746554539853e-05, "loss": 1.2844, "step": 8227 }, { "epoch": 0.22, "learning_rate": 1.8076944070363637e-05, "loss": 1.2913, "step": 8228 }, { "epoch": 0.22, "learning_rate": 1.807642253213853e-05, "loss": 1.5039, "step": 8229 }, { "epoch": 0.22, "learning_rate": 1.8075900930727294e-05, "loss": 1.303, "step": 8230 }, { "epoch": 0.22, "learning_rate": 1.8075379266134007e-05, "loss": 1.7739, "step": 8231 }, { "epoch": 0.22, "learning_rate": 1.8074857538362748e-05, "loss": 1.2661, "step": 8232 }, { "epoch": 0.22, "learning_rate": 1.8074335747417603e-05, "loss": 1.3552, "step": 8233 }, { "epoch": 0.22, "learning_rate": 1.807381389330265e-05, "loss": 1.3728, "step": 8234 }, { "epoch": 0.22, "learning_rate": 1.807329197602197e-05, "loss": 1.3867, "step": 8235 }, { "epoch": 0.22, "learning_rate": 1.8072769995579656e-05, "loss": 1.3171, "step": 8236 }, { "epoch": 0.22, "learning_rate": 1.8072247951979785e-05, "loss": 1.3379, "step": 8237 }, { "epoch": 0.22, "learning_rate": 1.8071725845226436e-05, "loss": 1.406, "step": 8238 }, { "epoch": 0.23, "learning_rate": 1.8071203675323708e-05, "loss": 1.4065, "step": 8239 }, { "epoch": 0.23, "learning_rate": 1.807068144227567e-05, "loss": 1.4673, "step": 8240 }, { "epoch": 0.23, "learning_rate": 1.807015914608642e-05, "loss": 1.2717, "step": 8241 }, { "epoch": 0.23, "learning_rate": 1.806963678676004e-05, "loss": 1.4502, "step": 8242 }, { "epoch": 0.23, "learning_rate": 1.8069114364300615e-05, "loss": 1.4595, "step": 8243 }, { "epoch": 0.23, "learning_rate": 1.8068591878712234e-05, "loss": 1.4185, "step": 8244 }, { "epoch": 0.23, "learning_rate": 1.8068069329998984e-05, "loss": 1.4863, "step": 8245 }, { "epoch": 0.23, "learning_rate": 1.8067546718164953e-05, "loss": 1.4336, "step": 8246 }, { "epoch": 0.23, "learning_rate": 1.806702404321423e-05, "loss": 1.3516, "step": 8247 }, { "epoch": 0.23, "learning_rate": 1.8066501305150904e-05, "loss": 1.49, "step": 8248 }, { "epoch": 0.23, "learning_rate": 1.8065978503979063e-05, "loss": 1.7407, "step": 8249 }, { "epoch": 0.23, "learning_rate": 1.8065455639702804e-05, "loss": 1.4614, "step": 8250 }, { "epoch": 0.23, "learning_rate": 1.8064932712326212e-05, "loss": 1.3101, "step": 8251 }, { "epoch": 0.23, "learning_rate": 1.8064409721853377e-05, "loss": 1.3069, "step": 8252 }, { "epoch": 0.23, "learning_rate": 1.8063886668288392e-05, "loss": 1.3755, "step": 8253 }, { "epoch": 0.23, "learning_rate": 1.8063363551635353e-05, "loss": 1.4663, "step": 8254 }, { "epoch": 0.23, "learning_rate": 1.8062840371898345e-05, "loss": 1.3809, "step": 8255 }, { "epoch": 0.23, "learning_rate": 1.8062317129081466e-05, "loss": 1.415, "step": 8256 }, { "epoch": 0.23, "learning_rate": 1.806179382318881e-05, "loss": 1.429, "step": 8257 }, { "epoch": 0.23, "learning_rate": 1.806127045422447e-05, "loss": 1.4133, "step": 8258 }, { "epoch": 0.23, "learning_rate": 1.806074702219254e-05, "loss": 1.3696, "step": 8259 }, { "epoch": 0.23, "learning_rate": 1.8060223527097117e-05, "loss": 1.4409, "step": 8260 }, { "epoch": 0.23, "learning_rate": 1.8059699968942296e-05, "loss": 1.2581, "step": 8261 }, { "epoch": 0.23, "learning_rate": 1.805917634773217e-05, "loss": 1.1453, "step": 8262 }, { "epoch": 0.23, "learning_rate": 1.805865266347084e-05, "loss": 1.4858, "step": 8263 }, { "epoch": 0.23, "learning_rate": 1.8058128916162402e-05, "loss": 1.4089, "step": 8264 }, { "epoch": 0.23, "learning_rate": 1.8057605105810948e-05, "loss": 1.3718, "step": 8265 }, { "epoch": 0.23, "learning_rate": 1.8057081232420584e-05, "loss": 1.4966, "step": 8266 }, { "epoch": 0.23, "learning_rate": 1.8056557295995404e-05, "loss": 1.7402, "step": 8267 }, { "epoch": 0.23, "learning_rate": 1.8056033296539508e-05, "loss": 1.4602, "step": 8268 }, { "epoch": 0.23, "learning_rate": 1.8055509234056997e-05, "loss": 1.2585, "step": 8269 }, { "epoch": 0.23, "learning_rate": 1.8054985108551966e-05, "loss": 1.2629, "step": 8270 }, { "epoch": 0.23, "learning_rate": 1.8054460920028524e-05, "loss": 1.4946, "step": 8271 }, { "epoch": 0.23, "learning_rate": 1.8053936668490767e-05, "loss": 1.4221, "step": 8272 }, { "epoch": 0.23, "learning_rate": 1.8053412353942792e-05, "loss": 1.3997, "step": 8273 }, { "epoch": 0.23, "learning_rate": 1.805288797638871e-05, "loss": 1.4338, "step": 8274 }, { "epoch": 0.23, "learning_rate": 1.8052363535832618e-05, "loss": 1.3735, "step": 8275 }, { "epoch": 0.23, "learning_rate": 1.805183903227862e-05, "loss": 1.3999, "step": 8276 }, { "epoch": 0.23, "learning_rate": 1.805131446573082e-05, "loss": 1.3352, "step": 8277 }, { "epoch": 0.23, "learning_rate": 1.8050789836193324e-05, "loss": 1.4365, "step": 8278 }, { "epoch": 0.23, "learning_rate": 1.805026514367023e-05, "loss": 1.5635, "step": 8279 }, { "epoch": 0.23, "learning_rate": 1.804974038816565e-05, "loss": 1.2544, "step": 8280 }, { "epoch": 0.23, "learning_rate": 1.8049215569683682e-05, "loss": 1.3857, "step": 8281 }, { "epoch": 0.23, "learning_rate": 1.804869068822844e-05, "loss": 1.293, "step": 8282 }, { "epoch": 0.23, "learning_rate": 1.8048165743804028e-05, "loss": 1.2153, "step": 8283 }, { "epoch": 0.23, "learning_rate": 1.804764073641455e-05, "loss": 1.3931, "step": 8284 }, { "epoch": 0.23, "learning_rate": 1.8047115666064114e-05, "loss": 1.4019, "step": 8285 }, { "epoch": 0.23, "learning_rate": 1.8046590532756833e-05, "loss": 1.4385, "step": 8286 }, { "epoch": 0.23, "learning_rate": 1.8046065336496806e-05, "loss": 1.5581, "step": 8287 }, { "epoch": 0.23, "learning_rate": 1.804554007728815e-05, "loss": 1.271, "step": 8288 }, { "epoch": 0.23, "learning_rate": 1.804501475513497e-05, "loss": 1.3853, "step": 8289 }, { "epoch": 0.23, "learning_rate": 1.804448937004138e-05, "loss": 1.457, "step": 8290 }, { "epoch": 0.23, "learning_rate": 1.8043963922011488e-05, "loss": 1.408, "step": 8291 }, { "epoch": 0.23, "learning_rate": 1.8043438411049404e-05, "loss": 1.3931, "step": 8292 }, { "epoch": 0.23, "learning_rate": 1.804291283715924e-05, "loss": 1.4121, "step": 8293 }, { "epoch": 0.23, "learning_rate": 1.8042387200345108e-05, "loss": 1.7476, "step": 8294 }, { "epoch": 0.23, "learning_rate": 1.8041861500611123e-05, "loss": 1.2676, "step": 8295 }, { "epoch": 0.23, "learning_rate": 1.804133573796139e-05, "loss": 1.2854, "step": 8296 }, { "epoch": 0.23, "learning_rate": 1.804080991240003e-05, "loss": 1.3936, "step": 8297 }, { "epoch": 0.23, "learning_rate": 1.8040284023931154e-05, "loss": 1.3989, "step": 8298 }, { "epoch": 0.23, "learning_rate": 1.803975807255888e-05, "loss": 1.4329, "step": 8299 }, { "epoch": 0.23, "learning_rate": 1.8039232058287314e-05, "loss": 1.2651, "step": 8300 }, { "epoch": 0.23, "learning_rate": 1.803870598112058e-05, "loss": 1.2493, "step": 8301 }, { "epoch": 0.23, "learning_rate": 1.803817984106279e-05, "loss": 1.498, "step": 8302 }, { "epoch": 0.23, "learning_rate": 1.803765363811806e-05, "loss": 1.3936, "step": 8303 }, { "epoch": 0.23, "learning_rate": 1.8037127372290507e-05, "loss": 1.4414, "step": 8304 }, { "epoch": 0.23, "learning_rate": 1.803660104358425e-05, "loss": 1.3716, "step": 8305 }, { "epoch": 0.23, "learning_rate": 1.8036074652003405e-05, "loss": 1.3906, "step": 8306 }, { "epoch": 0.23, "learning_rate": 1.8035548197552093e-05, "loss": 1.1335, "step": 8307 }, { "epoch": 0.23, "learning_rate": 1.8035021680234427e-05, "loss": 1.4392, "step": 8308 }, { "epoch": 0.23, "learning_rate": 1.803449510005453e-05, "loss": 1.2546, "step": 8309 }, { "epoch": 0.23, "learning_rate": 1.803396845701652e-05, "loss": 1.6577, "step": 8310 }, { "epoch": 0.23, "learning_rate": 1.8033441751124526e-05, "loss": 1.3638, "step": 8311 }, { "epoch": 0.23, "learning_rate": 1.8032914982382656e-05, "loss": 1.3267, "step": 8312 }, { "epoch": 0.23, "learning_rate": 1.8032388150795034e-05, "loss": 1.1572, "step": 8313 }, { "epoch": 0.23, "learning_rate": 1.803186125636579e-05, "loss": 1.3752, "step": 8314 }, { "epoch": 0.23, "learning_rate": 1.8031334299099037e-05, "loss": 1.4761, "step": 8315 }, { "epoch": 0.23, "learning_rate": 1.80308072789989e-05, "loss": 1.3933, "step": 8316 }, { "epoch": 0.23, "learning_rate": 1.8030280196069507e-05, "loss": 1.6099, "step": 8317 }, { "epoch": 0.23, "learning_rate": 1.8029753050314976e-05, "loss": 1.3711, "step": 8318 }, { "epoch": 0.23, "learning_rate": 1.8029225841739434e-05, "loss": 1.4541, "step": 8319 }, { "epoch": 0.23, "learning_rate": 1.8028698570347e-05, "loss": 1.3887, "step": 8320 }, { "epoch": 0.23, "learning_rate": 1.802817123614181e-05, "loss": 1.5022, "step": 8321 }, { "epoch": 0.23, "learning_rate": 1.802764383912798e-05, "loss": 1.385, "step": 8322 }, { "epoch": 0.23, "learning_rate": 1.8027116379309637e-05, "loss": 1.2656, "step": 8323 }, { "epoch": 0.23, "learning_rate": 1.8026588856690913e-05, "loss": 1.354, "step": 8324 }, { "epoch": 0.23, "learning_rate": 1.8026061271275935e-05, "loss": 1.52, "step": 8325 }, { "epoch": 0.23, "learning_rate": 1.8025533623068822e-05, "loss": 1.2793, "step": 8326 }, { "epoch": 0.23, "learning_rate": 1.8025005912073712e-05, "loss": 1.2642, "step": 8327 }, { "epoch": 0.23, "learning_rate": 1.8024478138294727e-05, "loss": 1.3315, "step": 8328 }, { "epoch": 0.23, "learning_rate": 1.8023950301736e-05, "loss": 1.3572, "step": 8329 }, { "epoch": 0.23, "learning_rate": 1.802342240240166e-05, "loss": 1.5059, "step": 8330 }, { "epoch": 0.23, "learning_rate": 1.8022894440295834e-05, "loss": 1.4268, "step": 8331 }, { "epoch": 0.23, "learning_rate": 1.8022366415422653e-05, "loss": 1.239, "step": 8332 }, { "epoch": 0.23, "learning_rate": 1.802183832778625e-05, "loss": 1.4902, "step": 8333 }, { "epoch": 0.23, "learning_rate": 1.802131017739076e-05, "loss": 1.3313, "step": 8334 }, { "epoch": 0.23, "learning_rate": 1.8020781964240308e-05, "loss": 1.3813, "step": 8335 }, { "epoch": 0.23, "learning_rate": 1.802025368833903e-05, "loss": 1.3845, "step": 8336 }, { "epoch": 0.23, "learning_rate": 1.801972534969106e-05, "loss": 1.3552, "step": 8337 }, { "epoch": 0.23, "learning_rate": 1.8019196948300528e-05, "loss": 1.5439, "step": 8338 }, { "epoch": 0.23, "learning_rate": 1.801866848417157e-05, "loss": 1.4077, "step": 8339 }, { "epoch": 0.23, "learning_rate": 1.8018139957308322e-05, "loss": 1.2168, "step": 8340 }, { "epoch": 0.23, "learning_rate": 1.8017611367714914e-05, "loss": 1.355, "step": 8341 }, { "epoch": 0.23, "learning_rate": 1.8017082715395487e-05, "loss": 1.4521, "step": 8342 }, { "epoch": 0.23, "learning_rate": 1.8016554000354175e-05, "loss": 1.5127, "step": 8343 }, { "epoch": 0.23, "learning_rate": 1.801602522259512e-05, "loss": 1.2864, "step": 8344 }, { "epoch": 0.23, "learning_rate": 1.801549638212244e-05, "loss": 1.4573, "step": 8345 }, { "epoch": 0.23, "learning_rate": 1.8014967478940295e-05, "loss": 1.4355, "step": 8346 }, { "epoch": 0.23, "learning_rate": 1.8014438513052812e-05, "loss": 1.4419, "step": 8347 }, { "epoch": 0.23, "learning_rate": 1.8013909484464128e-05, "loss": 1.6104, "step": 8348 }, { "epoch": 0.23, "learning_rate": 1.8013380393178387e-05, "loss": 1.3718, "step": 8349 }, { "epoch": 0.23, "learning_rate": 1.8012851239199727e-05, "loss": 1.4014, "step": 8350 }, { "epoch": 0.23, "learning_rate": 1.8012322022532283e-05, "loss": 1.4312, "step": 8351 }, { "epoch": 0.23, "learning_rate": 1.8011792743180203e-05, "loss": 1.3213, "step": 8352 }, { "epoch": 0.23, "learning_rate": 1.801126340114762e-05, "loss": 1.3582, "step": 8353 }, { "epoch": 0.23, "learning_rate": 1.8010733996438684e-05, "loss": 1.437, "step": 8354 }, { "epoch": 0.23, "learning_rate": 1.8010204529057528e-05, "loss": 1.3979, "step": 8355 }, { "epoch": 0.23, "learning_rate": 1.8009674999008304e-05, "loss": 1.5291, "step": 8356 }, { "epoch": 0.23, "learning_rate": 1.800914540629514e-05, "loss": 1.2634, "step": 8357 }, { "epoch": 0.23, "learning_rate": 1.8008615750922196e-05, "loss": 1.3745, "step": 8358 }, { "epoch": 0.23, "learning_rate": 1.8008086032893606e-05, "loss": 1.3911, "step": 8359 }, { "epoch": 0.23, "learning_rate": 1.8007556252213516e-05, "loss": 1.2844, "step": 8360 }, { "epoch": 0.23, "learning_rate": 1.8007026408886073e-05, "loss": 1.54, "step": 8361 }, { "epoch": 0.23, "learning_rate": 1.8006496502915418e-05, "loss": 1.5122, "step": 8362 }, { "epoch": 0.23, "learning_rate": 1.80059665343057e-05, "loss": 1.2986, "step": 8363 }, { "epoch": 0.23, "learning_rate": 1.8005436503061067e-05, "loss": 1.5039, "step": 8364 }, { "epoch": 0.23, "learning_rate": 1.800490640918566e-05, "loss": 1.2104, "step": 8365 }, { "epoch": 0.23, "learning_rate": 1.800437625268363e-05, "loss": 1.3372, "step": 8366 }, { "epoch": 0.23, "learning_rate": 1.8003846033559128e-05, "loss": 1.3467, "step": 8367 }, { "epoch": 0.23, "learning_rate": 1.8003315751816295e-05, "loss": 1.3984, "step": 8368 }, { "epoch": 0.23, "learning_rate": 1.8002785407459282e-05, "loss": 1.3267, "step": 8369 }, { "epoch": 0.23, "learning_rate": 1.800225500049224e-05, "loss": 1.3428, "step": 8370 }, { "epoch": 0.23, "learning_rate": 1.800172453091932e-05, "loss": 1.3723, "step": 8371 }, { "epoch": 0.23, "learning_rate": 1.8001193998744667e-05, "loss": 1.2898, "step": 8372 }, { "epoch": 0.23, "learning_rate": 1.8000663403972436e-05, "loss": 1.3462, "step": 8373 }, { "epoch": 0.23, "learning_rate": 1.8000132746606778e-05, "loss": 1.3115, "step": 8374 }, { "epoch": 0.23, "learning_rate": 1.799960202665184e-05, "loss": 1.3638, "step": 8375 }, { "epoch": 0.23, "learning_rate": 1.799907124411178e-05, "loss": 1.4077, "step": 8376 }, { "epoch": 0.23, "learning_rate": 1.7998540398990746e-05, "loss": 1.4463, "step": 8377 }, { "epoch": 0.23, "learning_rate": 1.7998009491292893e-05, "loss": 1.282, "step": 8378 }, { "epoch": 0.23, "learning_rate": 1.7997478521022378e-05, "loss": 1.3726, "step": 8379 }, { "epoch": 0.23, "learning_rate": 1.799694748818335e-05, "loss": 1.4524, "step": 8380 }, { "epoch": 0.23, "learning_rate": 1.7996416392779965e-05, "loss": 1.354, "step": 8381 }, { "epoch": 0.23, "learning_rate": 1.799588523481638e-05, "loss": 1.2878, "step": 8382 }, { "epoch": 0.23, "learning_rate": 1.7995354014296745e-05, "loss": 1.4072, "step": 8383 }, { "epoch": 0.23, "learning_rate": 1.7994822731225223e-05, "loss": 1.3162, "step": 8384 }, { "epoch": 0.23, "learning_rate": 1.7994291385605966e-05, "loss": 1.4243, "step": 8385 }, { "epoch": 0.23, "learning_rate": 1.7993759977443134e-05, "loss": 1.4595, "step": 8386 }, { "epoch": 0.23, "learning_rate": 1.799322850674088e-05, "loss": 1.3252, "step": 8387 }, { "epoch": 0.23, "learning_rate": 1.7992696973503366e-05, "loss": 1.3789, "step": 8388 }, { "epoch": 0.23, "learning_rate": 1.799216537773475e-05, "loss": 1.3455, "step": 8389 }, { "epoch": 0.23, "learning_rate": 1.799163371943919e-05, "loss": 1.3826, "step": 8390 }, { "epoch": 0.23, "learning_rate": 1.7991101998620844e-05, "loss": 1.3574, "step": 8391 }, { "epoch": 0.23, "learning_rate": 1.7990570215283877e-05, "loss": 1.3359, "step": 8392 }, { "epoch": 0.23, "learning_rate": 1.7990038369432447e-05, "loss": 1.417, "step": 8393 }, { "epoch": 0.23, "learning_rate": 1.798950646107071e-05, "loss": 1.1917, "step": 8394 }, { "epoch": 0.23, "learning_rate": 1.798897449020283e-05, "loss": 1.2241, "step": 8395 }, { "epoch": 0.23, "learning_rate": 1.7988442456832977e-05, "loss": 1.355, "step": 8396 }, { "epoch": 0.23, "learning_rate": 1.79879103609653e-05, "loss": 1.3181, "step": 8397 }, { "epoch": 0.23, "learning_rate": 1.7987378202603972e-05, "loss": 1.4353, "step": 8398 }, { "epoch": 0.23, "learning_rate": 1.7986845981753153e-05, "loss": 1.4448, "step": 8399 }, { "epoch": 0.23, "learning_rate": 1.7986313698417005e-05, "loss": 1.4124, "step": 8400 }, { "epoch": 0.23, "learning_rate": 1.7985781352599695e-05, "loss": 1.4336, "step": 8401 }, { "epoch": 0.23, "learning_rate": 1.7985248944305387e-05, "loss": 1.4731, "step": 8402 }, { "epoch": 0.23, "learning_rate": 1.7984716473538246e-05, "loss": 1.3347, "step": 8403 }, { "epoch": 0.23, "learning_rate": 1.798418394030244e-05, "loss": 1.2983, "step": 8404 }, { "epoch": 0.23, "learning_rate": 1.798365134460213e-05, "loss": 1.3928, "step": 8405 }, { "epoch": 0.23, "learning_rate": 1.7983118686441487e-05, "loss": 1.3132, "step": 8406 }, { "epoch": 0.23, "learning_rate": 1.7982585965824678e-05, "loss": 1.4136, "step": 8407 }, { "epoch": 0.23, "learning_rate": 1.798205318275587e-05, "loss": 1.6685, "step": 8408 }, { "epoch": 0.23, "learning_rate": 1.798152033723923e-05, "loss": 1.4233, "step": 8409 }, { "epoch": 0.23, "learning_rate": 1.798098742927893e-05, "loss": 1.3835, "step": 8410 }, { "epoch": 0.23, "learning_rate": 1.7980454458879136e-05, "loss": 1.4756, "step": 8411 }, { "epoch": 0.23, "learning_rate": 1.797992142604402e-05, "loss": 1.4019, "step": 8412 }, { "epoch": 0.23, "learning_rate": 1.7979388330777753e-05, "loss": 1.356, "step": 8413 }, { "epoch": 0.23, "learning_rate": 1.79788551730845e-05, "loss": 1.3325, "step": 8414 }, { "epoch": 0.23, "learning_rate": 1.7978321952968435e-05, "loss": 1.2451, "step": 8415 }, { "epoch": 0.23, "learning_rate": 1.7977788670433733e-05, "loss": 1.4653, "step": 8416 }, { "epoch": 0.23, "learning_rate": 1.7977255325484565e-05, "loss": 1.4272, "step": 8417 }, { "epoch": 0.23, "learning_rate": 1.79767219181251e-05, "loss": 1.4312, "step": 8418 }, { "epoch": 0.23, "learning_rate": 1.7976188448359516e-05, "loss": 1.4297, "step": 8419 }, { "epoch": 0.23, "learning_rate": 1.7975654916191983e-05, "loss": 1.3442, "step": 8420 }, { "epoch": 0.23, "learning_rate": 1.7975121321626678e-05, "loss": 1.2241, "step": 8421 }, { "epoch": 0.23, "learning_rate": 1.7974587664667774e-05, "loss": 1.4087, "step": 8422 }, { "epoch": 0.23, "learning_rate": 1.7974053945319445e-05, "loss": 1.3484, "step": 8423 }, { "epoch": 0.23, "learning_rate": 1.797352016358587e-05, "loss": 1.3423, "step": 8424 }, { "epoch": 0.23, "learning_rate": 1.7972986319471216e-05, "loss": 1.5337, "step": 8425 }, { "epoch": 0.23, "learning_rate": 1.797245241297967e-05, "loss": 1.3135, "step": 8426 }, { "epoch": 0.23, "learning_rate": 1.7971918444115406e-05, "loss": 1.342, "step": 8427 }, { "epoch": 0.23, "learning_rate": 1.79713844128826e-05, "loss": 1.4048, "step": 8428 }, { "epoch": 0.23, "learning_rate": 1.797085031928543e-05, "loss": 1.333, "step": 8429 }, { "epoch": 0.23, "learning_rate": 1.7970316163328078e-05, "loss": 1.4272, "step": 8430 }, { "epoch": 0.23, "learning_rate": 1.7969781945014717e-05, "loss": 1.2532, "step": 8431 }, { "epoch": 0.23, "learning_rate": 1.7969247664349532e-05, "loss": 1.3813, "step": 8432 }, { "epoch": 0.23, "learning_rate": 1.79687133213367e-05, "loss": 1.3452, "step": 8433 }, { "epoch": 0.23, "learning_rate": 1.79681789159804e-05, "loss": 1.3218, "step": 8434 }, { "epoch": 0.23, "learning_rate": 1.796764444828482e-05, "loss": 1.3813, "step": 8435 }, { "epoch": 0.23, "learning_rate": 1.796710991825413e-05, "loss": 1.417, "step": 8436 }, { "epoch": 0.23, "learning_rate": 1.7966575325892525e-05, "loss": 1.4192, "step": 8437 }, { "epoch": 0.23, "learning_rate": 1.7966040671204178e-05, "loss": 1.3794, "step": 8438 }, { "epoch": 0.23, "learning_rate": 1.796550595419327e-05, "loss": 1.1433, "step": 8439 }, { "epoch": 0.23, "learning_rate": 1.7964971174863998e-05, "loss": 1.385, "step": 8440 }, { "epoch": 0.23, "learning_rate": 1.796443633322053e-05, "loss": 1.4341, "step": 8441 }, { "epoch": 0.23, "learning_rate": 1.796390142926706e-05, "loss": 1.4412, "step": 8442 }, { "epoch": 0.23, "learning_rate": 1.796336646300777e-05, "loss": 1.3716, "step": 8443 }, { "epoch": 0.23, "learning_rate": 1.7962831434446846e-05, "loss": 1.3728, "step": 8444 }, { "epoch": 0.23, "learning_rate": 1.796229634358847e-05, "loss": 1.3987, "step": 8445 }, { "epoch": 0.23, "learning_rate": 1.7961761190436837e-05, "loss": 1.2729, "step": 8446 }, { "epoch": 0.23, "learning_rate": 1.7961225974996127e-05, "loss": 1.6274, "step": 8447 }, { "epoch": 0.23, "learning_rate": 1.7960690697270524e-05, "loss": 1.3809, "step": 8448 }, { "epoch": 0.23, "learning_rate": 1.7960155357264224e-05, "loss": 1.4321, "step": 8449 }, { "epoch": 0.23, "learning_rate": 1.795961995498141e-05, "loss": 1.2092, "step": 8450 }, { "epoch": 0.23, "learning_rate": 1.7959084490426274e-05, "loss": 1.3748, "step": 8451 }, { "epoch": 0.23, "learning_rate": 1.7958548963603003e-05, "loss": 1.5408, "step": 8452 }, { "epoch": 0.23, "learning_rate": 1.7958013374515786e-05, "loss": 1.4209, "step": 8453 }, { "epoch": 0.23, "learning_rate": 1.7957477723168818e-05, "loss": 1.4314, "step": 8454 }, { "epoch": 0.23, "learning_rate": 1.795694200956628e-05, "loss": 1.4976, "step": 8455 }, { "epoch": 0.23, "learning_rate": 1.7956406233712375e-05, "loss": 1.4321, "step": 8456 }, { "epoch": 0.23, "learning_rate": 1.7955870395611285e-05, "loss": 1.5801, "step": 8457 }, { "epoch": 0.23, "learning_rate": 1.7955334495267212e-05, "loss": 1.2227, "step": 8458 }, { "epoch": 0.23, "learning_rate": 1.7954798532684337e-05, "loss": 1.3276, "step": 8459 }, { "epoch": 0.23, "learning_rate": 1.7954262507866862e-05, "loss": 1.3633, "step": 8460 }, { "epoch": 0.23, "learning_rate": 1.7953726420818977e-05, "loss": 1.23, "step": 8461 }, { "epoch": 0.23, "learning_rate": 1.7953190271544874e-05, "loss": 1.3599, "step": 8462 }, { "epoch": 0.23, "learning_rate": 1.7952654060048753e-05, "loss": 1.364, "step": 8463 }, { "epoch": 0.23, "learning_rate": 1.7952117786334807e-05, "loss": 1.4485, "step": 8464 }, { "epoch": 0.23, "learning_rate": 1.7951581450407226e-05, "loss": 1.2661, "step": 8465 }, { "epoch": 0.23, "learning_rate": 1.7951045052270215e-05, "loss": 1.2878, "step": 8466 }, { "epoch": 0.23, "learning_rate": 1.7950508591927964e-05, "loss": 1.4155, "step": 8467 }, { "epoch": 0.23, "learning_rate": 1.7949972069384673e-05, "loss": 1.4192, "step": 8468 }, { "epoch": 0.23, "learning_rate": 1.794943548464454e-05, "loss": 1.7095, "step": 8469 }, { "epoch": 0.23, "learning_rate": 1.7948898837711764e-05, "loss": 1.4524, "step": 8470 }, { "epoch": 0.23, "learning_rate": 1.7948362128590537e-05, "loss": 1.3828, "step": 8471 }, { "epoch": 0.23, "learning_rate": 1.7947825357285066e-05, "loss": 1.4194, "step": 8472 }, { "epoch": 0.23, "learning_rate": 1.7947288523799544e-05, "loss": 1.3152, "step": 8473 }, { "epoch": 0.23, "learning_rate": 1.7946751628138175e-05, "loss": 1.4204, "step": 8474 }, { "epoch": 0.23, "learning_rate": 1.7946214670305157e-05, "loss": 1.3352, "step": 8475 }, { "epoch": 0.23, "learning_rate": 1.794567765030469e-05, "loss": 1.4353, "step": 8476 }, { "epoch": 0.23, "learning_rate": 1.794514056814098e-05, "loss": 1.375, "step": 8477 }, { "epoch": 0.23, "learning_rate": 1.7944603423818227e-05, "loss": 1.1689, "step": 8478 }, { "epoch": 0.23, "learning_rate": 1.794406621734063e-05, "loss": 1.3333, "step": 8479 }, { "epoch": 0.23, "learning_rate": 1.79435289487124e-05, "loss": 1.3979, "step": 8480 }, { "epoch": 0.23, "learning_rate": 1.7942991617937728e-05, "loss": 1.3911, "step": 8481 }, { "epoch": 0.23, "learning_rate": 1.794245422502083e-05, "loss": 1.3074, "step": 8482 }, { "epoch": 0.23, "learning_rate": 1.79419167699659e-05, "loss": 1.2456, "step": 8483 }, { "epoch": 0.23, "learning_rate": 1.7941379252777152e-05, "loss": 1.4065, "step": 8484 }, { "epoch": 0.23, "learning_rate": 1.7940841673458788e-05, "loss": 1.5034, "step": 8485 }, { "epoch": 0.23, "learning_rate": 1.794030403201501e-05, "loss": 1.4839, "step": 8486 }, { "epoch": 0.23, "learning_rate": 1.7939766328450026e-05, "loss": 1.4771, "step": 8487 }, { "epoch": 0.23, "learning_rate": 1.7939228562768046e-05, "loss": 1.4629, "step": 8488 }, { "epoch": 0.23, "learning_rate": 1.7938690734973274e-05, "loss": 1.3066, "step": 8489 }, { "epoch": 0.23, "learning_rate": 1.7938152845069917e-05, "loss": 1.4644, "step": 8490 }, { "epoch": 0.23, "learning_rate": 1.793761489306219e-05, "loss": 1.3083, "step": 8491 }, { "epoch": 0.23, "learning_rate": 1.793707687895429e-05, "loss": 1.3071, "step": 8492 }, { "epoch": 0.23, "learning_rate": 1.7936538802750435e-05, "loss": 1.3123, "step": 8493 }, { "epoch": 0.23, "learning_rate": 1.7936000664454835e-05, "loss": 1.2576, "step": 8494 }, { "epoch": 0.23, "learning_rate": 1.7935462464071697e-05, "loss": 1.3784, "step": 8495 }, { "epoch": 0.23, "learning_rate": 1.793492420160523e-05, "loss": 1.3503, "step": 8496 }, { "epoch": 0.23, "learning_rate": 1.793438587705965e-05, "loss": 1.5718, "step": 8497 }, { "epoch": 0.23, "learning_rate": 1.7933847490439164e-05, "loss": 1.3958, "step": 8498 }, { "epoch": 0.23, "learning_rate": 1.7933309041747985e-05, "loss": 1.4189, "step": 8499 }, { "epoch": 0.23, "learning_rate": 1.7932770530990328e-05, "loss": 1.4453, "step": 8500 }, { "epoch": 0.23, "learning_rate": 1.7932231958170408e-05, "loss": 1.3345, "step": 8501 }, { "epoch": 0.23, "learning_rate": 1.793169332329243e-05, "loss": 1.3296, "step": 8502 }, { "epoch": 0.23, "learning_rate": 1.7931154626360613e-05, "loss": 1.3962, "step": 8503 }, { "epoch": 0.23, "learning_rate": 1.7930615867379175e-05, "loss": 1.3879, "step": 8504 }, { "epoch": 0.23, "learning_rate": 1.7930077046352326e-05, "loss": 1.2786, "step": 8505 }, { "epoch": 0.23, "learning_rate": 1.7929538163284285e-05, "loss": 1.1614, "step": 8506 }, { "epoch": 0.23, "learning_rate": 1.7928999218179263e-05, "loss": 1.3137, "step": 8507 }, { "epoch": 0.23, "learning_rate": 1.7928460211041484e-05, "loss": 1.7354, "step": 8508 }, { "epoch": 0.23, "learning_rate": 1.7927921141875155e-05, "loss": 1.3442, "step": 8509 }, { "epoch": 0.23, "learning_rate": 1.7927382010684505e-05, "loss": 1.3523, "step": 8510 }, { "epoch": 0.23, "learning_rate": 1.792684281747374e-05, "loss": 1.2039, "step": 8511 }, { "epoch": 0.23, "learning_rate": 1.792630356224709e-05, "loss": 1.2834, "step": 8512 }, { "epoch": 0.23, "learning_rate": 1.7925764245008764e-05, "loss": 1.2957, "step": 8513 }, { "epoch": 0.23, "learning_rate": 1.7925224865762985e-05, "loss": 1.3159, "step": 8514 }, { "epoch": 0.23, "learning_rate": 1.7924685424513977e-05, "loss": 1.5317, "step": 8515 }, { "epoch": 0.23, "learning_rate": 1.7924145921265956e-05, "loss": 1.3792, "step": 8516 }, { "epoch": 0.23, "learning_rate": 1.792360635602314e-05, "loss": 1.4485, "step": 8517 }, { "epoch": 0.23, "learning_rate": 1.7923066728789755e-05, "loss": 1.1926, "step": 8518 }, { "epoch": 0.23, "learning_rate": 1.7922527039570022e-05, "loss": 1.2485, "step": 8519 }, { "epoch": 0.23, "learning_rate": 1.7921987288368162e-05, "loss": 1.1898, "step": 8520 }, { "epoch": 0.23, "learning_rate": 1.7921447475188403e-05, "loss": 1.5605, "step": 8521 }, { "epoch": 0.23, "learning_rate": 1.792090760003496e-05, "loss": 1.5391, "step": 8522 }, { "epoch": 0.23, "learning_rate": 1.7920367662912062e-05, "loss": 1.4126, "step": 8523 }, { "epoch": 0.23, "learning_rate": 1.7919827663823934e-05, "loss": 1.4092, "step": 8524 }, { "epoch": 0.23, "learning_rate": 1.7919287602774792e-05, "loss": 1.2534, "step": 8525 }, { "epoch": 0.23, "learning_rate": 1.791874747976887e-05, "loss": 1.7588, "step": 8526 }, { "epoch": 0.23, "learning_rate": 1.7918207294810396e-05, "loss": 1.3164, "step": 8527 }, { "epoch": 0.23, "learning_rate": 1.7917667047903585e-05, "loss": 1.4385, "step": 8528 }, { "epoch": 0.23, "learning_rate": 1.791712673905268e-05, "loss": 1.4375, "step": 8529 }, { "epoch": 0.23, "learning_rate": 1.7916586368261888e-05, "loss": 1.2891, "step": 8530 }, { "epoch": 0.23, "learning_rate": 1.791604593553545e-05, "loss": 1.4131, "step": 8531 }, { "epoch": 0.23, "learning_rate": 1.7915505440877595e-05, "loss": 1.3818, "step": 8532 }, { "epoch": 0.23, "learning_rate": 1.7914964884292543e-05, "loss": 1.4565, "step": 8533 }, { "epoch": 0.23, "learning_rate": 1.7914424265784527e-05, "loss": 1.4028, "step": 8534 }, { "epoch": 0.23, "learning_rate": 1.791388358535778e-05, "loss": 1.47, "step": 8535 }, { "epoch": 0.23, "learning_rate": 1.791334284301653e-05, "loss": 1.3657, "step": 8536 }, { "epoch": 0.23, "learning_rate": 1.7912802038765006e-05, "loss": 1.3396, "step": 8537 }, { "epoch": 0.23, "learning_rate": 1.7912261172607437e-05, "loss": 1.4888, "step": 8538 }, { "epoch": 0.23, "learning_rate": 1.791172024454806e-05, "loss": 1.3149, "step": 8539 }, { "epoch": 0.23, "learning_rate": 1.7911179254591102e-05, "loss": 1.5508, "step": 8540 }, { "epoch": 0.23, "learning_rate": 1.7910638202740797e-05, "loss": 1.1401, "step": 8541 }, { "epoch": 0.23, "learning_rate": 1.7910097089001382e-05, "loss": 1.4675, "step": 8542 }, { "epoch": 0.23, "learning_rate": 1.7909555913377086e-05, "loss": 1.2539, "step": 8543 }, { "epoch": 0.23, "learning_rate": 1.790901467587214e-05, "loss": 1.3047, "step": 8544 }, { "epoch": 0.23, "learning_rate": 1.790847337649079e-05, "loss": 1.4363, "step": 8545 }, { "epoch": 0.23, "learning_rate": 1.7907932015237258e-05, "loss": 1.3977, "step": 8546 }, { "epoch": 0.23, "learning_rate": 1.7907390592115783e-05, "loss": 1.4568, "step": 8547 }, { "epoch": 0.23, "learning_rate": 1.7906849107130603e-05, "loss": 1.2896, "step": 8548 }, { "epoch": 0.23, "learning_rate": 1.7906307560285956e-05, "loss": 1.2659, "step": 8549 }, { "epoch": 0.23, "learning_rate": 1.7905765951586074e-05, "loss": 1.4866, "step": 8550 }, { "epoch": 0.23, "learning_rate": 1.79052242810352e-05, "loss": 1.384, "step": 8551 }, { "epoch": 0.23, "learning_rate": 1.7904682548637567e-05, "loss": 1.3374, "step": 8552 }, { "epoch": 0.23, "learning_rate": 1.7904140754397416e-05, "loss": 1.4763, "step": 8553 }, { "epoch": 0.23, "learning_rate": 1.790359889831898e-05, "loss": 1.3491, "step": 8554 }, { "epoch": 0.23, "learning_rate": 1.790305698040651e-05, "loss": 1.3967, "step": 8555 }, { "epoch": 0.23, "learning_rate": 1.790251500066423e-05, "loss": 1.3335, "step": 8556 }, { "epoch": 0.23, "learning_rate": 1.7901972959096398e-05, "loss": 1.4409, "step": 8557 }, { "epoch": 0.23, "learning_rate": 1.7901430855707235e-05, "loss": 1.364, "step": 8558 }, { "epoch": 0.23, "learning_rate": 1.7900888690500998e-05, "loss": 1.1316, "step": 8559 }, { "epoch": 0.23, "learning_rate": 1.7900346463481922e-05, "loss": 1.4285, "step": 8560 }, { "epoch": 0.23, "learning_rate": 1.7899804174654255e-05, "loss": 1.3323, "step": 8561 }, { "epoch": 0.23, "learning_rate": 1.7899261824022233e-05, "loss": 1.3054, "step": 8562 }, { "epoch": 0.23, "learning_rate": 1.7898719411590098e-05, "loss": 1.2866, "step": 8563 }, { "epoch": 0.23, "learning_rate": 1.7898176937362094e-05, "loss": 1.7456, "step": 8564 }, { "epoch": 0.23, "learning_rate": 1.789763440134247e-05, "loss": 1.4834, "step": 8565 }, { "epoch": 0.23, "learning_rate": 1.789709180353547e-05, "loss": 1.3481, "step": 8566 }, { "epoch": 0.23, "learning_rate": 1.789654914394534e-05, "loss": 1.3899, "step": 8567 }, { "epoch": 0.23, "learning_rate": 1.7896006422576317e-05, "loss": 1.4092, "step": 8568 }, { "epoch": 0.23, "learning_rate": 1.7895463639432657e-05, "loss": 1.3328, "step": 8569 }, { "epoch": 0.23, "learning_rate": 1.78949207945186e-05, "loss": 1.6885, "step": 8570 }, { "epoch": 0.23, "learning_rate": 1.7894377887838393e-05, "loss": 1.4458, "step": 8571 }, { "epoch": 0.23, "learning_rate": 1.7893834919396288e-05, "loss": 1.3994, "step": 8572 }, { "epoch": 0.23, "learning_rate": 1.7893291889196532e-05, "loss": 1.3494, "step": 8573 }, { "epoch": 0.23, "learning_rate": 1.7892748797243372e-05, "loss": 1.2891, "step": 8574 }, { "epoch": 0.23, "learning_rate": 1.7892205643541056e-05, "loss": 1.4224, "step": 8575 }, { "epoch": 0.23, "learning_rate": 1.7891662428093832e-05, "loss": 1.3425, "step": 8576 }, { "epoch": 0.23, "learning_rate": 1.7891119150905954e-05, "loss": 1.3071, "step": 8577 }, { "epoch": 0.23, "learning_rate": 1.789057581198167e-05, "loss": 1.4375, "step": 8578 }, { "epoch": 0.23, "learning_rate": 1.789003241132523e-05, "loss": 1.4434, "step": 8579 }, { "epoch": 0.23, "learning_rate": 1.7889488948940886e-05, "loss": 1.2405, "step": 8580 }, { "epoch": 0.23, "learning_rate": 1.7888945424832896e-05, "loss": 1.469, "step": 8581 }, { "epoch": 0.23, "learning_rate": 1.78884018390055e-05, "loss": 1.187, "step": 8582 }, { "epoch": 0.23, "learning_rate": 1.7887858191462962e-05, "loss": 1.3594, "step": 8583 }, { "epoch": 0.23, "learning_rate": 1.7887314482209527e-05, "loss": 1.3784, "step": 8584 }, { "epoch": 0.23, "learning_rate": 1.7886770711249453e-05, "loss": 1.5298, "step": 8585 }, { "epoch": 0.23, "learning_rate": 1.7886226878586997e-05, "loss": 1.2878, "step": 8586 }, { "epoch": 0.23, "learning_rate": 1.7885682984226407e-05, "loss": 1.4355, "step": 8587 }, { "epoch": 0.23, "learning_rate": 1.7885139028171946e-05, "loss": 1.1479, "step": 8588 }, { "epoch": 0.23, "learning_rate": 1.788459501042786e-05, "loss": 1.2874, "step": 8589 }, { "epoch": 0.23, "learning_rate": 1.7884050930998412e-05, "loss": 1.4878, "step": 8590 }, { "epoch": 0.23, "learning_rate": 1.7883506789887858e-05, "loss": 1.7666, "step": 8591 }, { "epoch": 0.23, "learning_rate": 1.788296258710045e-05, "loss": 1.3291, "step": 8592 }, { "epoch": 0.23, "learning_rate": 1.7882418322640453e-05, "loss": 1.4561, "step": 8593 }, { "epoch": 0.23, "learning_rate": 1.788187399651212e-05, "loss": 1.4084, "step": 8594 }, { "epoch": 0.23, "learning_rate": 1.7881329608719713e-05, "loss": 1.4192, "step": 8595 }, { "epoch": 0.23, "learning_rate": 1.7880785159267485e-05, "loss": 1.3762, "step": 8596 }, { "epoch": 0.23, "learning_rate": 1.7880240648159706e-05, "loss": 1.4988, "step": 8597 }, { "epoch": 0.23, "learning_rate": 1.7879696075400627e-05, "loss": 1.3215, "step": 8598 }, { "epoch": 0.23, "learning_rate": 1.787915144099451e-05, "loss": 1.3921, "step": 8599 }, { "epoch": 0.23, "learning_rate": 1.7878606744945618e-05, "loss": 1.5432, "step": 8600 }, { "epoch": 0.23, "learning_rate": 1.7878061987258212e-05, "loss": 1.3865, "step": 8601 }, { "epoch": 0.23, "learning_rate": 1.7877517167936553e-05, "loss": 1.1899, "step": 8602 }, { "epoch": 0.23, "learning_rate": 1.7876972286984905e-05, "loss": 1.3972, "step": 8603 }, { "epoch": 0.23, "learning_rate": 1.7876427344407528e-05, "loss": 1.4272, "step": 8604 }, { "epoch": 0.23, "learning_rate": 1.787588234020869e-05, "loss": 1.4695, "step": 8605 }, { "epoch": 0.24, "learning_rate": 1.7875337274392646e-05, "loss": 1.3459, "step": 8606 }, { "epoch": 0.24, "learning_rate": 1.7874792146963674e-05, "loss": 1.4263, "step": 8607 }, { "epoch": 0.24, "learning_rate": 1.7874246957926028e-05, "loss": 1.4517, "step": 8608 }, { "epoch": 0.24, "learning_rate": 1.7873701707283974e-05, "loss": 1.4727, "step": 8609 }, { "epoch": 0.24, "learning_rate": 1.7873156395041787e-05, "loss": 1.3438, "step": 8610 }, { "epoch": 0.24, "learning_rate": 1.7872611021203717e-05, "loss": 1.2166, "step": 8611 }, { "epoch": 0.24, "learning_rate": 1.7872065585774046e-05, "loss": 1.2292, "step": 8612 }, { "epoch": 0.24, "learning_rate": 1.7871520088757036e-05, "loss": 1.1956, "step": 8613 }, { "epoch": 0.24, "learning_rate": 1.7870974530156954e-05, "loss": 1.2581, "step": 8614 }, { "epoch": 0.24, "learning_rate": 1.7870428909978067e-05, "loss": 1.4397, "step": 8615 }, { "epoch": 0.24, "learning_rate": 1.786988322822465e-05, "loss": 1.5349, "step": 8616 }, { "epoch": 0.24, "learning_rate": 1.786933748490096e-05, "loss": 1.3711, "step": 8617 }, { "epoch": 0.24, "learning_rate": 1.786879168001128e-05, "loss": 1.3757, "step": 8618 }, { "epoch": 0.24, "learning_rate": 1.786824581355987e-05, "loss": 1.3857, "step": 8619 }, { "epoch": 0.24, "learning_rate": 1.7867699885551007e-05, "loss": 1.262, "step": 8620 }, { "epoch": 0.24, "learning_rate": 1.786715389598896e-05, "loss": 1.2642, "step": 8621 }, { "epoch": 0.24, "learning_rate": 1.7866607844877996e-05, "loss": 1.3901, "step": 8622 }, { "epoch": 0.24, "learning_rate": 1.7866061732222397e-05, "loss": 1.3762, "step": 8623 }, { "epoch": 0.24, "learning_rate": 1.786551555802643e-05, "loss": 1.2625, "step": 8624 }, { "epoch": 0.24, "learning_rate": 1.786496932229436e-05, "loss": 1.8779, "step": 8625 }, { "epoch": 0.24, "learning_rate": 1.7864423025030475e-05, "loss": 1.2417, "step": 8626 }, { "epoch": 0.24, "learning_rate": 1.786387666623904e-05, "loss": 1.3154, "step": 8627 }, { "epoch": 0.24, "learning_rate": 1.7863330245924335e-05, "loss": 1.459, "step": 8628 }, { "epoch": 0.24, "learning_rate": 1.786278376409063e-05, "loss": 1.5283, "step": 8629 }, { "epoch": 0.24, "learning_rate": 1.78622372207422e-05, "loss": 1.5063, "step": 8630 }, { "epoch": 0.24, "learning_rate": 1.7861690615883326e-05, "loss": 1.4534, "step": 8631 }, { "epoch": 0.24, "learning_rate": 1.786114394951828e-05, "loss": 1.3813, "step": 8632 }, { "epoch": 0.24, "learning_rate": 1.7860597221651343e-05, "loss": 1.4446, "step": 8633 }, { "epoch": 0.24, "learning_rate": 1.7860050432286783e-05, "loss": 1.4329, "step": 8634 }, { "epoch": 0.24, "learning_rate": 1.785950358142889e-05, "loss": 1.3909, "step": 8635 }, { "epoch": 0.24, "learning_rate": 1.7858956669081936e-05, "loss": 1.3447, "step": 8636 }, { "epoch": 0.24, "learning_rate": 1.78584096952502e-05, "loss": 1.3542, "step": 8637 }, { "epoch": 0.24, "learning_rate": 1.7857862659937962e-05, "loss": 1.3796, "step": 8638 }, { "epoch": 0.24, "learning_rate": 1.78573155631495e-05, "loss": 1.3218, "step": 8639 }, { "epoch": 0.24, "learning_rate": 1.78567684048891e-05, "loss": 1.2231, "step": 8640 }, { "epoch": 0.24, "learning_rate": 1.7856221185161034e-05, "loss": 1.2793, "step": 8641 }, { "epoch": 0.24, "learning_rate": 1.785567390396959e-05, "loss": 1.3086, "step": 8642 }, { "epoch": 0.24, "learning_rate": 1.7855126561319046e-05, "loss": 1.3638, "step": 8643 }, { "epoch": 0.24, "learning_rate": 1.785457915721369e-05, "loss": 1.5068, "step": 8644 }, { "epoch": 0.24, "learning_rate": 1.7854031691657794e-05, "loss": 1.4321, "step": 8645 }, { "epoch": 0.24, "learning_rate": 1.7853484164655647e-05, "loss": 1.7144, "step": 8646 }, { "epoch": 0.24, "learning_rate": 1.785293657621154e-05, "loss": 1.4448, "step": 8647 }, { "epoch": 0.24, "learning_rate": 1.7852388926329745e-05, "loss": 1.4592, "step": 8648 }, { "epoch": 0.24, "learning_rate": 1.785184121501455e-05, "loss": 1.3799, "step": 8649 }, { "epoch": 0.24, "learning_rate": 1.7851293442270244e-05, "loss": 1.301, "step": 8650 }, { "epoch": 0.24, "learning_rate": 1.785074560810111e-05, "loss": 1.4375, "step": 8651 }, { "epoch": 0.24, "learning_rate": 1.7850197712511433e-05, "loss": 1.4036, "step": 8652 }, { "epoch": 0.24, "learning_rate": 1.78496497555055e-05, "loss": 1.3376, "step": 8653 }, { "epoch": 0.24, "learning_rate": 1.78491017370876e-05, "loss": 1.4055, "step": 8654 }, { "epoch": 0.24, "learning_rate": 1.784855365726202e-05, "loss": 1.3096, "step": 8655 }, { "epoch": 0.24, "learning_rate": 1.7848005516033047e-05, "loss": 1.2976, "step": 8656 }, { "epoch": 0.24, "learning_rate": 1.784745731340497e-05, "loss": 1.3179, "step": 8657 }, { "epoch": 0.24, "learning_rate": 1.784690904938207e-05, "loss": 1.3806, "step": 8658 }, { "epoch": 0.24, "learning_rate": 1.784636072396865e-05, "loss": 1.4229, "step": 8659 }, { "epoch": 0.24, "learning_rate": 1.784581233716899e-05, "loss": 1.2214, "step": 8660 }, { "epoch": 0.24, "learning_rate": 1.7845263888987386e-05, "loss": 1.4668, "step": 8661 }, { "epoch": 0.24, "learning_rate": 1.7844715379428127e-05, "loss": 1.5115, "step": 8662 }, { "epoch": 0.24, "learning_rate": 1.78441668084955e-05, "loss": 1.4478, "step": 8663 }, { "epoch": 0.24, "learning_rate": 1.7843618176193806e-05, "loss": 1.376, "step": 8664 }, { "epoch": 0.24, "learning_rate": 1.7843069482527325e-05, "loss": 1.3831, "step": 8665 }, { "epoch": 0.24, "learning_rate": 1.7842520727500365e-05, "loss": 1.2793, "step": 8666 }, { "epoch": 0.24, "learning_rate": 1.78419719111172e-05, "loss": 1.4312, "step": 8667 }, { "epoch": 0.24, "learning_rate": 1.7841423033382142e-05, "loss": 1.3691, "step": 8668 }, { "epoch": 0.24, "learning_rate": 1.7840874094299476e-05, "loss": 1.6572, "step": 8669 }, { "epoch": 0.24, "learning_rate": 1.7840325093873498e-05, "loss": 1.2605, "step": 8670 }, { "epoch": 0.24, "learning_rate": 1.7839776032108504e-05, "loss": 1.3892, "step": 8671 }, { "epoch": 0.24, "learning_rate": 1.7839226909008787e-05, "loss": 1.2578, "step": 8672 }, { "epoch": 0.24, "learning_rate": 1.7838677724578644e-05, "loss": 1.384, "step": 8673 }, { "epoch": 0.24, "learning_rate": 1.7838128478822376e-05, "loss": 1.5659, "step": 8674 }, { "epoch": 0.24, "learning_rate": 1.783757917174427e-05, "loss": 1.345, "step": 8675 }, { "epoch": 0.24, "learning_rate": 1.783702980334864e-05, "loss": 1.4111, "step": 8676 }, { "epoch": 0.24, "learning_rate": 1.783648037363977e-05, "loss": 1.3755, "step": 8677 }, { "epoch": 0.24, "learning_rate": 1.783593088262196e-05, "loss": 1.2031, "step": 8678 }, { "epoch": 0.24, "learning_rate": 1.7835381330299512e-05, "loss": 1.2739, "step": 8679 }, { "epoch": 0.24, "learning_rate": 1.7834831716676727e-05, "loss": 1.4209, "step": 8680 }, { "epoch": 0.24, "learning_rate": 1.78342820417579e-05, "loss": 1.4399, "step": 8681 }, { "epoch": 0.24, "learning_rate": 1.7833732305547335e-05, "loss": 1.334, "step": 8682 }, { "epoch": 0.24, "learning_rate": 1.7833182508049333e-05, "loss": 1.4014, "step": 8683 }, { "epoch": 0.24, "learning_rate": 1.7832632649268196e-05, "loss": 1.4651, "step": 8684 }, { "epoch": 0.24, "learning_rate": 1.7832082729208224e-05, "loss": 1.3914, "step": 8685 }, { "epoch": 0.24, "learning_rate": 1.7831532747873715e-05, "loss": 1.3667, "step": 8686 }, { "epoch": 0.24, "learning_rate": 1.783098270526898e-05, "loss": 1.4951, "step": 8687 }, { "epoch": 0.24, "learning_rate": 1.7830432601398318e-05, "loss": 1.4448, "step": 8688 }, { "epoch": 0.24, "learning_rate": 1.7829882436266035e-05, "loss": 1.408, "step": 8689 }, { "epoch": 0.24, "learning_rate": 1.7829332209876434e-05, "loss": 1.3813, "step": 8690 }, { "epoch": 0.24, "learning_rate": 1.7828781922233816e-05, "loss": 1.4751, "step": 8691 }, { "epoch": 0.24, "learning_rate": 1.7828231573342492e-05, "loss": 1.4692, "step": 8692 }, { "epoch": 0.24, "learning_rate": 1.7827681163206766e-05, "loss": 1.4067, "step": 8693 }, { "epoch": 0.24, "learning_rate": 1.782713069183094e-05, "loss": 1.52, "step": 8694 }, { "epoch": 0.24, "learning_rate": 1.7826580159219326e-05, "loss": 1.345, "step": 8695 }, { "epoch": 0.24, "learning_rate": 1.7826029565376228e-05, "loss": 1.3662, "step": 8696 }, { "epoch": 0.24, "learning_rate": 1.7825478910305957e-05, "loss": 1.4353, "step": 8697 }, { "epoch": 0.24, "learning_rate": 1.782492819401282e-05, "loss": 1.4961, "step": 8698 }, { "epoch": 0.24, "learning_rate": 1.7824377416501122e-05, "loss": 1.4084, "step": 8699 }, { "epoch": 0.24, "learning_rate": 1.7823826577775175e-05, "loss": 1.4873, "step": 8700 }, { "epoch": 0.24, "learning_rate": 1.7823275677839286e-05, "loss": 1.2925, "step": 8701 }, { "epoch": 0.24, "learning_rate": 1.782272471669777e-05, "loss": 1.3093, "step": 8702 }, { "epoch": 0.24, "learning_rate": 1.7822173694354933e-05, "loss": 1.3452, "step": 8703 }, { "epoch": 0.24, "learning_rate": 1.7821622610815085e-05, "loss": 1.458, "step": 8704 }, { "epoch": 0.24, "learning_rate": 1.782107146608254e-05, "loss": 1.4146, "step": 8705 }, { "epoch": 0.24, "learning_rate": 1.7820520260161614e-05, "loss": 1.3088, "step": 8706 }, { "epoch": 0.24, "learning_rate": 1.781996899305661e-05, "loss": 1.4116, "step": 8707 }, { "epoch": 0.24, "learning_rate": 1.781941766477185e-05, "loss": 1.3574, "step": 8708 }, { "epoch": 0.24, "learning_rate": 1.781886627531164e-05, "loss": 1.5129, "step": 8709 }, { "epoch": 0.24, "learning_rate": 1.78183148246803e-05, "loss": 1.3628, "step": 8710 }, { "epoch": 0.24, "learning_rate": 1.781776331288214e-05, "loss": 1.3674, "step": 8711 }, { "epoch": 0.24, "learning_rate": 1.7817211739921477e-05, "loss": 1.2083, "step": 8712 }, { "epoch": 0.24, "learning_rate": 1.781666010580262e-05, "loss": 1.1643, "step": 8713 }, { "epoch": 0.24, "learning_rate": 1.7816108410529896e-05, "loss": 1.7246, "step": 8714 }, { "epoch": 0.24, "learning_rate": 1.7815556654107613e-05, "loss": 1.3174, "step": 8715 }, { "epoch": 0.24, "learning_rate": 1.781500483654009e-05, "loss": 1.4099, "step": 8716 }, { "epoch": 0.24, "learning_rate": 1.7814452957831642e-05, "loss": 1.4771, "step": 8717 }, { "epoch": 0.24, "learning_rate": 1.781390101798659e-05, "loss": 1.4551, "step": 8718 }, { "epoch": 0.24, "learning_rate": 1.781334901700925e-05, "loss": 1.3918, "step": 8719 }, { "epoch": 0.24, "learning_rate": 1.7812796954903944e-05, "loss": 1.3823, "step": 8720 }, { "epoch": 0.24, "learning_rate": 1.781224483167499e-05, "loss": 1.2219, "step": 8721 }, { "epoch": 0.24, "learning_rate": 1.78116926473267e-05, "loss": 1.2905, "step": 8722 }, { "epoch": 0.24, "learning_rate": 1.7811140401863403e-05, "loss": 1.262, "step": 8723 }, { "epoch": 0.24, "learning_rate": 1.7810588095289417e-05, "loss": 1.2883, "step": 8724 }, { "epoch": 0.24, "learning_rate": 1.7810035727609064e-05, "loss": 1.2729, "step": 8725 }, { "epoch": 0.24, "learning_rate": 1.780948329882666e-05, "loss": 1.23, "step": 8726 }, { "epoch": 0.24, "learning_rate": 1.780893080894653e-05, "loss": 1.3171, "step": 8727 }, { "epoch": 0.24, "learning_rate": 1.7808378257973005e-05, "loss": 1.3423, "step": 8728 }, { "epoch": 0.24, "learning_rate": 1.7807825645910396e-05, "loss": 1.262, "step": 8729 }, { "epoch": 0.24, "learning_rate": 1.780727297276303e-05, "loss": 1.4175, "step": 8730 }, { "epoch": 0.24, "learning_rate": 1.780672023853523e-05, "loss": 1.2639, "step": 8731 }, { "epoch": 0.24, "learning_rate": 1.7806167443231323e-05, "loss": 1.3291, "step": 8732 }, { "epoch": 0.24, "learning_rate": 1.7805614586855637e-05, "loss": 1.3281, "step": 8733 }, { "epoch": 0.24, "learning_rate": 1.7805061669412486e-05, "loss": 1.3167, "step": 8734 }, { "epoch": 0.24, "learning_rate": 1.7804508690906205e-05, "loss": 1.501, "step": 8735 }, { "epoch": 0.24, "learning_rate": 1.780395565134112e-05, "loss": 1.3508, "step": 8736 }, { "epoch": 0.24, "learning_rate": 1.7803402550721556e-05, "loss": 1.436, "step": 8737 }, { "epoch": 0.24, "learning_rate": 1.780284938905184e-05, "loss": 1.3042, "step": 8738 }, { "epoch": 0.24, "learning_rate": 1.7802296166336295e-05, "loss": 1.4404, "step": 8739 }, { "epoch": 0.24, "learning_rate": 1.780174288257926e-05, "loss": 1.4146, "step": 8740 }, { "epoch": 0.24, "learning_rate": 1.7801189537785052e-05, "loss": 1.3076, "step": 8741 }, { "epoch": 0.24, "learning_rate": 1.7800636131958008e-05, "loss": 1.4185, "step": 8742 }, { "epoch": 0.24, "learning_rate": 1.7800082665102454e-05, "loss": 1.4009, "step": 8743 }, { "epoch": 0.24, "learning_rate": 1.779952913722272e-05, "loss": 1.4526, "step": 8744 }, { "epoch": 0.24, "learning_rate": 1.779897554832314e-05, "loss": 1.4124, "step": 8745 }, { "epoch": 0.24, "learning_rate": 1.7798421898408043e-05, "loss": 1.3433, "step": 8746 }, { "epoch": 0.24, "learning_rate": 1.7797868187481758e-05, "loss": 1.4705, "step": 8747 }, { "epoch": 0.24, "learning_rate": 1.7797314415548623e-05, "loss": 1.428, "step": 8748 }, { "epoch": 0.24, "learning_rate": 1.779676058261296e-05, "loss": 1.4517, "step": 8749 }, { "epoch": 0.24, "learning_rate": 1.7796206688679115e-05, "loss": 1.408, "step": 8750 }, { "epoch": 0.24, "learning_rate": 1.779565273375141e-05, "loss": 1.1072, "step": 8751 }, { "epoch": 0.24, "learning_rate": 1.7795098717834185e-05, "loss": 1.3523, "step": 8752 }, { "epoch": 0.24, "learning_rate": 1.7794544640931773e-05, "loss": 1.3362, "step": 8753 }, { "epoch": 0.24, "learning_rate": 1.7793990503048512e-05, "loss": 1.4033, "step": 8754 }, { "epoch": 0.24, "learning_rate": 1.7793436304188732e-05, "loss": 1.3623, "step": 8755 }, { "epoch": 0.24, "learning_rate": 1.7792882044356772e-05, "loss": 1.53, "step": 8756 }, { "epoch": 0.24, "learning_rate": 1.779232772355697e-05, "loss": 1.3389, "step": 8757 }, { "epoch": 0.24, "learning_rate": 1.7791773341793655e-05, "loss": 1.4526, "step": 8758 }, { "epoch": 0.24, "learning_rate": 1.779121889907117e-05, "loss": 1.3037, "step": 8759 }, { "epoch": 0.24, "learning_rate": 1.7790664395393852e-05, "loss": 1.5361, "step": 8760 }, { "epoch": 0.24, "learning_rate": 1.779010983076604e-05, "loss": 1.5386, "step": 8761 }, { "epoch": 0.24, "learning_rate": 1.778955520519207e-05, "loss": 1.2632, "step": 8762 }, { "epoch": 0.24, "learning_rate": 1.7789000518676287e-05, "loss": 1.5352, "step": 8763 }, { "epoch": 0.24, "learning_rate": 1.7788445771223028e-05, "loss": 1.3193, "step": 8764 }, { "epoch": 0.24, "learning_rate": 1.7787890962836628e-05, "loss": 1.3667, "step": 8765 }, { "epoch": 0.24, "learning_rate": 1.778733609352143e-05, "loss": 1.239, "step": 8766 }, { "epoch": 0.24, "learning_rate": 1.7786781163281777e-05, "loss": 1.5103, "step": 8767 }, { "epoch": 0.24, "learning_rate": 1.778622617212201e-05, "loss": 1.4651, "step": 8768 }, { "epoch": 0.24, "learning_rate": 1.7785671120046472e-05, "loss": 1.354, "step": 8769 }, { "epoch": 0.24, "learning_rate": 1.7785116007059505e-05, "loss": 1.2354, "step": 8770 }, { "epoch": 0.24, "learning_rate": 1.7784560833165452e-05, "loss": 1.4224, "step": 8771 }, { "epoch": 0.24, "learning_rate": 1.7784005598368653e-05, "loss": 1.3943, "step": 8772 }, { "epoch": 0.24, "learning_rate": 1.7783450302673454e-05, "loss": 1.5271, "step": 8773 }, { "epoch": 0.24, "learning_rate": 1.77828949460842e-05, "loss": 1.3633, "step": 8774 }, { "epoch": 0.24, "learning_rate": 1.7782339528605237e-05, "loss": 1.3025, "step": 8775 }, { "epoch": 0.24, "learning_rate": 1.7781784050240908e-05, "loss": 1.4773, "step": 8776 }, { "epoch": 0.24, "learning_rate": 1.778122851099556e-05, "loss": 1.2117, "step": 8777 }, { "epoch": 0.24, "learning_rate": 1.778067291087354e-05, "loss": 1.1904, "step": 8778 }, { "epoch": 0.24, "learning_rate": 1.7780117249879194e-05, "loss": 1.3623, "step": 8779 }, { "epoch": 0.24, "learning_rate": 1.7779561528016868e-05, "loss": 1.2468, "step": 8780 }, { "epoch": 0.24, "learning_rate": 1.777900574529091e-05, "loss": 1.2202, "step": 8781 }, { "epoch": 0.24, "learning_rate": 1.777844990170567e-05, "loss": 1.4138, "step": 8782 }, { "epoch": 0.24, "learning_rate": 1.7777893997265498e-05, "loss": 1.4309, "step": 8783 }, { "epoch": 0.24, "learning_rate": 1.777733803197474e-05, "loss": 1.5151, "step": 8784 }, { "epoch": 0.24, "learning_rate": 1.7776782005837744e-05, "loss": 1.1688, "step": 8785 }, { "epoch": 0.24, "learning_rate": 1.7776225918858864e-05, "loss": 1.2705, "step": 8786 }, { "epoch": 0.24, "learning_rate": 1.777566977104245e-05, "loss": 1.4563, "step": 8787 }, { "epoch": 0.24, "learning_rate": 1.777511356239285e-05, "loss": 1.4319, "step": 8788 }, { "epoch": 0.24, "learning_rate": 1.777455729291442e-05, "loss": 1.4868, "step": 8789 }, { "epoch": 0.24, "learning_rate": 1.7774000962611507e-05, "loss": 1.3965, "step": 8790 }, { "epoch": 0.24, "learning_rate": 1.7773444571488466e-05, "loss": 1.8208, "step": 8791 }, { "epoch": 0.24, "learning_rate": 1.7772888119549652e-05, "loss": 1.3564, "step": 8792 }, { "epoch": 0.24, "learning_rate": 1.7772331606799415e-05, "loss": 1.3682, "step": 8793 }, { "epoch": 0.24, "learning_rate": 1.7771775033242113e-05, "loss": 1.5273, "step": 8794 }, { "epoch": 0.24, "learning_rate": 1.7771218398882095e-05, "loss": 1.2949, "step": 8795 }, { "epoch": 0.24, "learning_rate": 1.7770661703723716e-05, "loss": 1.3943, "step": 8796 }, { "epoch": 0.24, "learning_rate": 1.7770104947771337e-05, "loss": 1.2957, "step": 8797 }, { "epoch": 0.24, "learning_rate": 1.7769548131029313e-05, "loss": 1.4106, "step": 8798 }, { "epoch": 0.24, "learning_rate": 1.7768991253501993e-05, "loss": 1.5337, "step": 8799 }, { "epoch": 0.24, "learning_rate": 1.776843431519374e-05, "loss": 1.4045, "step": 8800 }, { "epoch": 0.24, "learning_rate": 1.776787731610891e-05, "loss": 1.2416, "step": 8801 }, { "epoch": 0.24, "learning_rate": 1.7767320256251864e-05, "loss": 1.4854, "step": 8802 }, { "epoch": 0.24, "learning_rate": 1.7766763135626956e-05, "loss": 1.3979, "step": 8803 }, { "epoch": 0.24, "learning_rate": 1.7766205954238543e-05, "loss": 1.3518, "step": 8804 }, { "epoch": 0.24, "learning_rate": 1.776564871209099e-05, "loss": 1.3804, "step": 8805 }, { "epoch": 0.24, "learning_rate": 1.776509140918865e-05, "loss": 1.2358, "step": 8806 }, { "epoch": 0.24, "learning_rate": 1.7764534045535887e-05, "loss": 1.3469, "step": 8807 }, { "epoch": 0.24, "learning_rate": 1.776397662113706e-05, "loss": 1.4639, "step": 8808 }, { "epoch": 0.24, "learning_rate": 1.776341913599653e-05, "loss": 1.3464, "step": 8809 }, { "epoch": 0.24, "learning_rate": 1.776286159011866e-05, "loss": 1.2576, "step": 8810 }, { "epoch": 0.24, "learning_rate": 1.7762303983507813e-05, "loss": 1.4023, "step": 8811 }, { "epoch": 0.24, "learning_rate": 1.7761746316168348e-05, "loss": 1.4185, "step": 8812 }, { "epoch": 0.24, "learning_rate": 1.776118858810463e-05, "loss": 1.3435, "step": 8813 }, { "epoch": 0.24, "learning_rate": 1.776063079932102e-05, "loss": 1.2998, "step": 8814 }, { "epoch": 0.24, "learning_rate": 1.776007294982189e-05, "loss": 1.2913, "step": 8815 }, { "epoch": 0.24, "learning_rate": 1.7759515039611593e-05, "loss": 1.3875, "step": 8816 }, { "epoch": 0.24, "learning_rate": 1.77589570686945e-05, "loss": 1.3547, "step": 8817 }, { "epoch": 0.24, "learning_rate": 1.7758399037074978e-05, "loss": 1.3479, "step": 8818 }, { "epoch": 0.24, "learning_rate": 1.775784094475739e-05, "loss": 1.1577, "step": 8819 }, { "epoch": 0.24, "learning_rate": 1.7757282791746098e-05, "loss": 1.3677, "step": 8820 }, { "epoch": 0.24, "learning_rate": 1.7756724578045476e-05, "loss": 1.4495, "step": 8821 }, { "epoch": 0.24, "learning_rate": 1.7756166303659887e-05, "loss": 1.2561, "step": 8822 }, { "epoch": 0.24, "learning_rate": 1.77556079685937e-05, "loss": 1.4302, "step": 8823 }, { "epoch": 0.24, "learning_rate": 1.7755049572851285e-05, "loss": 1.1885, "step": 8824 }, { "epoch": 0.24, "learning_rate": 1.775449111643701e-05, "loss": 1.3083, "step": 8825 }, { "epoch": 0.24, "learning_rate": 1.7753932599355242e-05, "loss": 1.2488, "step": 8826 }, { "epoch": 0.24, "learning_rate": 1.775337402161035e-05, "loss": 1.4338, "step": 8827 }, { "epoch": 0.24, "learning_rate": 1.7752815383206706e-05, "loss": 1.4414, "step": 8828 }, { "epoch": 0.24, "learning_rate": 1.775225668414868e-05, "loss": 1.4907, "step": 8829 }, { "epoch": 0.24, "learning_rate": 1.7751697924440642e-05, "loss": 1.4092, "step": 8830 }, { "epoch": 0.24, "learning_rate": 1.7751139104086966e-05, "loss": 1.3545, "step": 8831 }, { "epoch": 0.24, "learning_rate": 1.7750580223092023e-05, "loss": 1.3936, "step": 8832 }, { "epoch": 0.24, "learning_rate": 1.7750021281460187e-05, "loss": 1.2068, "step": 8833 }, { "epoch": 0.24, "learning_rate": 1.7749462279195825e-05, "loss": 1.156, "step": 8834 }, { "epoch": 0.24, "learning_rate": 1.7748903216303314e-05, "loss": 1.4158, "step": 8835 }, { "epoch": 0.24, "learning_rate": 1.774834409278703e-05, "loss": 1.3839, "step": 8836 }, { "epoch": 0.24, "learning_rate": 1.7747784908651344e-05, "loss": 1.3054, "step": 8837 }, { "epoch": 0.24, "learning_rate": 1.7747225663900633e-05, "loss": 1.3101, "step": 8838 }, { "epoch": 0.24, "learning_rate": 1.774666635853927e-05, "loss": 1.4614, "step": 8839 }, { "epoch": 0.24, "learning_rate": 1.7746106992571635e-05, "loss": 1.4214, "step": 8840 }, { "epoch": 0.24, "learning_rate": 1.77455475660021e-05, "loss": 1.3345, "step": 8841 }, { "epoch": 0.24, "learning_rate": 1.774498807883504e-05, "loss": 1.26, "step": 8842 }, { "epoch": 0.24, "learning_rate": 1.774442853107484e-05, "loss": 1.4387, "step": 8843 }, { "epoch": 0.24, "learning_rate": 1.7743868922725872e-05, "loss": 1.4961, "step": 8844 }, { "epoch": 0.24, "learning_rate": 1.7743309253792512e-05, "loss": 1.1555, "step": 8845 }, { "epoch": 0.24, "learning_rate": 1.7742749524279143e-05, "loss": 1.0894, "step": 8846 }, { "epoch": 0.24, "learning_rate": 1.774218973419014e-05, "loss": 1.4009, "step": 8847 }, { "epoch": 0.24, "learning_rate": 1.7741629883529895e-05, "loss": 1.2651, "step": 8848 }, { "epoch": 0.24, "learning_rate": 1.7741069972302768e-05, "loss": 1.3184, "step": 8849 }, { "epoch": 0.24, "learning_rate": 1.7740510000513154e-05, "loss": 1.3086, "step": 8850 }, { "epoch": 0.24, "learning_rate": 1.7739949968165428e-05, "loss": 1.3535, "step": 8851 }, { "epoch": 0.24, "learning_rate": 1.7739389875263974e-05, "loss": 1.3142, "step": 8852 }, { "epoch": 0.24, "learning_rate": 1.7738829721813173e-05, "loss": 1.2507, "step": 8853 }, { "epoch": 0.24, "learning_rate": 1.773826950781741e-05, "loss": 1.3704, "step": 8854 }, { "epoch": 0.24, "learning_rate": 1.773770923328106e-05, "loss": 1.3691, "step": 8855 }, { "epoch": 0.24, "learning_rate": 1.773714889820851e-05, "loss": 1.2837, "step": 8856 }, { "epoch": 0.24, "learning_rate": 1.773658850260415e-05, "loss": 1.3977, "step": 8857 }, { "epoch": 0.24, "learning_rate": 1.773602804647236e-05, "loss": 1.4644, "step": 8858 }, { "epoch": 0.24, "learning_rate": 1.773546752981752e-05, "loss": 1.2606, "step": 8859 }, { "epoch": 0.24, "learning_rate": 1.7734906952644025e-05, "loss": 1.415, "step": 8860 }, { "epoch": 0.24, "learning_rate": 1.773434631495625e-05, "loss": 1.4189, "step": 8861 }, { "epoch": 0.24, "learning_rate": 1.773378561675859e-05, "loss": 1.3494, "step": 8862 }, { "epoch": 0.24, "learning_rate": 1.7733224858055428e-05, "loss": 1.3303, "step": 8863 }, { "epoch": 0.24, "learning_rate": 1.7732664038851147e-05, "loss": 1.4753, "step": 8864 }, { "epoch": 0.24, "learning_rate": 1.7732103159150143e-05, "loss": 1.4912, "step": 8865 }, { "epoch": 0.24, "learning_rate": 1.7731542218956797e-05, "loss": 1.584, "step": 8866 }, { "epoch": 0.24, "learning_rate": 1.7730981218275503e-05, "loss": 1.469, "step": 8867 }, { "epoch": 0.24, "learning_rate": 1.7730420157110643e-05, "loss": 1.2869, "step": 8868 }, { "epoch": 0.24, "learning_rate": 1.7729859035466617e-05, "loss": 1.5156, "step": 8869 }, { "epoch": 0.24, "learning_rate": 1.7729297853347803e-05, "loss": 1.3218, "step": 8870 }, { "epoch": 0.24, "learning_rate": 1.7728736610758603e-05, "loss": 1.3977, "step": 8871 }, { "epoch": 0.24, "learning_rate": 1.7728175307703396e-05, "loss": 1.3562, "step": 8872 }, { "epoch": 0.24, "learning_rate": 1.7727613944186584e-05, "loss": 1.4062, "step": 8873 }, { "epoch": 0.24, "learning_rate": 1.7727052520212553e-05, "loss": 1.4834, "step": 8874 }, { "epoch": 0.24, "learning_rate": 1.7726491035785694e-05, "loss": 1.3804, "step": 8875 }, { "epoch": 0.24, "learning_rate": 1.7725929490910405e-05, "loss": 1.3142, "step": 8876 }, { "epoch": 0.24, "learning_rate": 1.7725367885591077e-05, "loss": 1.2637, "step": 8877 }, { "epoch": 0.24, "learning_rate": 1.7724806219832104e-05, "loss": 1.4314, "step": 8878 }, { "epoch": 0.24, "learning_rate": 1.7724244493637875e-05, "loss": 1.3765, "step": 8879 }, { "epoch": 0.24, "learning_rate": 1.7723682707012796e-05, "loss": 1.2847, "step": 8880 }, { "epoch": 0.24, "learning_rate": 1.772312085996125e-05, "loss": 1.4688, "step": 8881 }, { "epoch": 0.24, "learning_rate": 1.772255895248764e-05, "loss": 1.377, "step": 8882 }, { "epoch": 0.24, "learning_rate": 1.772199698459636e-05, "loss": 1.405, "step": 8883 }, { "epoch": 0.24, "learning_rate": 1.7721434956291808e-05, "loss": 1.2644, "step": 8884 }, { "epoch": 0.24, "learning_rate": 1.7720872867578377e-05, "loss": 1.3723, "step": 8885 }, { "epoch": 0.24, "learning_rate": 1.772031071846047e-05, "loss": 1.3325, "step": 8886 }, { "epoch": 0.24, "learning_rate": 1.771974850894248e-05, "loss": 1.2371, "step": 8887 }, { "epoch": 0.24, "learning_rate": 1.7719186239028808e-05, "loss": 1.3726, "step": 8888 }, { "epoch": 0.24, "learning_rate": 1.7718623908723854e-05, "loss": 1.2891, "step": 8889 }, { "epoch": 0.24, "learning_rate": 1.7718061518032014e-05, "loss": 1.428, "step": 8890 }, { "epoch": 0.24, "learning_rate": 1.7717499066957692e-05, "loss": 1.4116, "step": 8891 }, { "epoch": 0.24, "learning_rate": 1.7716936555505286e-05, "loss": 1.4287, "step": 8892 }, { "epoch": 0.24, "learning_rate": 1.7716373983679197e-05, "loss": 1.522, "step": 8893 }, { "epoch": 0.24, "learning_rate": 1.7715811351483827e-05, "loss": 1.3269, "step": 8894 }, { "epoch": 0.24, "learning_rate": 1.771524865892358e-05, "loss": 1.3958, "step": 8895 }, { "epoch": 0.24, "learning_rate": 1.771468590600285e-05, "loss": 1.283, "step": 8896 }, { "epoch": 0.24, "learning_rate": 1.771412309272605e-05, "loss": 1.2664, "step": 8897 }, { "epoch": 0.24, "learning_rate": 1.771356021909757e-05, "loss": 1.2859, "step": 8898 }, { "epoch": 0.24, "learning_rate": 1.771299728512183e-05, "loss": 1.2681, "step": 8899 }, { "epoch": 0.24, "learning_rate": 1.7712434290803226e-05, "loss": 1.2363, "step": 8900 }, { "epoch": 0.24, "learning_rate": 1.7711871236146158e-05, "loss": 1.4502, "step": 8901 }, { "epoch": 0.24, "learning_rate": 1.771130812115504e-05, "loss": 1.4365, "step": 8902 }, { "epoch": 0.24, "learning_rate": 1.7710744945834272e-05, "loss": 1.3816, "step": 8903 }, { "epoch": 0.24, "learning_rate": 1.7710181710188263e-05, "loss": 1.3926, "step": 8904 }, { "epoch": 0.24, "learning_rate": 1.7709618414221412e-05, "loss": 1.4004, "step": 8905 }, { "epoch": 0.24, "learning_rate": 1.7709055057938138e-05, "loss": 1.4573, "step": 8906 }, { "epoch": 0.24, "learning_rate": 1.770849164134284e-05, "loss": 1.4243, "step": 8907 }, { "epoch": 0.24, "learning_rate": 1.7707928164439927e-05, "loss": 1.2439, "step": 8908 }, { "epoch": 0.24, "learning_rate": 1.770736462723381e-05, "loss": 1.3989, "step": 8909 }, { "epoch": 0.24, "learning_rate": 1.77068010297289e-05, "loss": 1.3943, "step": 8910 }, { "epoch": 0.24, "learning_rate": 1.7706237371929597e-05, "loss": 1.3779, "step": 8911 }, { "epoch": 0.24, "learning_rate": 1.770567365384032e-05, "loss": 1.2935, "step": 8912 }, { "epoch": 0.24, "learning_rate": 1.770510987546547e-05, "loss": 1.2087, "step": 8913 }, { "epoch": 0.24, "learning_rate": 1.7704546036809472e-05, "loss": 1.2446, "step": 8914 }, { "epoch": 0.24, "learning_rate": 1.7703982137876722e-05, "loss": 1.302, "step": 8915 }, { "epoch": 0.24, "learning_rate": 1.7703418178671642e-05, "loss": 1.3923, "step": 8916 }, { "epoch": 0.24, "learning_rate": 1.770285415919864e-05, "loss": 1.2913, "step": 8917 }, { "epoch": 0.24, "learning_rate": 1.7702290079462127e-05, "loss": 1.4229, "step": 8918 }, { "epoch": 0.24, "learning_rate": 1.770172593946652e-05, "loss": 1.4055, "step": 8919 }, { "epoch": 0.24, "learning_rate": 1.7701161739216233e-05, "loss": 1.5249, "step": 8920 }, { "epoch": 0.24, "learning_rate": 1.770059747871568e-05, "loss": 1.4587, "step": 8921 }, { "epoch": 0.24, "learning_rate": 1.7700033157969266e-05, "loss": 1.3594, "step": 8922 }, { "epoch": 0.24, "learning_rate": 1.7699468776981413e-05, "loss": 1.3491, "step": 8923 }, { "epoch": 0.24, "learning_rate": 1.7698904335756544e-05, "loss": 1.7842, "step": 8924 }, { "epoch": 0.24, "learning_rate": 1.7698339834299064e-05, "loss": 1.3933, "step": 8925 }, { "epoch": 0.24, "learning_rate": 1.7697775272613394e-05, "loss": 1.4951, "step": 8926 }, { "epoch": 0.24, "learning_rate": 1.769721065070395e-05, "loss": 1.3711, "step": 8927 }, { "epoch": 0.24, "learning_rate": 1.7696645968575147e-05, "loss": 1.377, "step": 8928 }, { "epoch": 0.24, "learning_rate": 1.7696081226231407e-05, "loss": 1.3401, "step": 8929 }, { "epoch": 0.24, "learning_rate": 1.7695516423677146e-05, "loss": 1.1094, "step": 8930 }, { "epoch": 0.24, "learning_rate": 1.7694951560916783e-05, "loss": 1.5522, "step": 8931 }, { "epoch": 0.24, "learning_rate": 1.769438663795474e-05, "loss": 1.3296, "step": 8932 }, { "epoch": 0.24, "learning_rate": 1.7693821654795432e-05, "loss": 1.4424, "step": 8933 }, { "epoch": 0.24, "learning_rate": 1.769325661144328e-05, "loss": 1.4475, "step": 8934 }, { "epoch": 0.24, "learning_rate": 1.769269150790271e-05, "loss": 1.2444, "step": 8935 }, { "epoch": 0.24, "learning_rate": 1.7692126344178134e-05, "loss": 1.1858, "step": 8936 }, { "epoch": 0.24, "learning_rate": 1.7691561120273984e-05, "loss": 1.3372, "step": 8937 }, { "epoch": 0.24, "learning_rate": 1.769099583619467e-05, "loss": 1.3848, "step": 8938 }, { "epoch": 0.24, "learning_rate": 1.7690430491944625e-05, "loss": 1.3916, "step": 8939 }, { "epoch": 0.24, "learning_rate": 1.7689865087528267e-05, "loss": 1.3721, "step": 8940 }, { "epoch": 0.24, "learning_rate": 1.7689299622950026e-05, "loss": 1.3589, "step": 8941 }, { "epoch": 0.24, "learning_rate": 1.7688734098214312e-05, "loss": 1.512, "step": 8942 }, { "epoch": 0.24, "learning_rate": 1.7688168513325565e-05, "loss": 1.5227, "step": 8943 }, { "epoch": 0.24, "learning_rate": 1.7687602868288198e-05, "loss": 1.2466, "step": 8944 }, { "epoch": 0.24, "learning_rate": 1.7687037163106643e-05, "loss": 1.3562, "step": 8945 }, { "epoch": 0.24, "learning_rate": 1.7686471397785322e-05, "loss": 1.3674, "step": 8946 }, { "epoch": 0.24, "learning_rate": 1.7685905572328666e-05, "loss": 1.384, "step": 8947 }, { "epoch": 0.24, "learning_rate": 1.7685339686741098e-05, "loss": 1.3025, "step": 8948 }, { "epoch": 0.24, "learning_rate": 1.7684773741027045e-05, "loss": 1.2947, "step": 8949 }, { "epoch": 0.24, "learning_rate": 1.7684207735190935e-05, "loss": 1.4194, "step": 8950 }, { "epoch": 0.24, "learning_rate": 1.7683641669237198e-05, "loss": 1.4194, "step": 8951 }, { "epoch": 0.24, "learning_rate": 1.7683075543170264e-05, "loss": 1.3555, "step": 8952 }, { "epoch": 0.24, "learning_rate": 1.7682509356994558e-05, "loss": 1.2678, "step": 8953 }, { "epoch": 0.24, "learning_rate": 1.7681943110714513e-05, "loss": 1.4585, "step": 8954 }, { "epoch": 0.24, "learning_rate": 1.768137680433456e-05, "loss": 1.4873, "step": 8955 }, { "epoch": 0.24, "learning_rate": 1.768081043785912e-05, "loss": 1.3499, "step": 8956 }, { "epoch": 0.24, "learning_rate": 1.7680244011292634e-05, "loss": 1.2512, "step": 8957 }, { "epoch": 0.24, "learning_rate": 1.7679677524639532e-05, "loss": 1.2905, "step": 8958 }, { "epoch": 0.24, "learning_rate": 1.7679110977904243e-05, "loss": 1.3921, "step": 8959 }, { "epoch": 0.24, "learning_rate": 1.7678544371091196e-05, "loss": 1.2786, "step": 8960 }, { "epoch": 0.24, "learning_rate": 1.7677977704204835e-05, "loss": 1.3191, "step": 8961 }, { "epoch": 0.24, "learning_rate": 1.7677410977249584e-05, "loss": 1.3403, "step": 8962 }, { "epoch": 0.24, "learning_rate": 1.767684419022988e-05, "loss": 1.3049, "step": 8963 }, { "epoch": 0.24, "learning_rate": 1.7676277343150156e-05, "loss": 1.5688, "step": 8964 }, { "epoch": 0.24, "learning_rate": 1.767571043601485e-05, "loss": 1.1956, "step": 8965 }, { "epoch": 0.24, "learning_rate": 1.7675143468828397e-05, "loss": 1.3833, "step": 8966 }, { "epoch": 0.24, "learning_rate": 1.7674576441595226e-05, "loss": 1.3018, "step": 8967 }, { "epoch": 0.24, "learning_rate": 1.767400935431978e-05, "loss": 1.3604, "step": 8968 }, { "epoch": 0.24, "learning_rate": 1.767344220700649e-05, "loss": 1.3813, "step": 8969 }, { "epoch": 0.24, "learning_rate": 1.76728749996598e-05, "loss": 1.2544, "step": 8970 }, { "epoch": 0.24, "learning_rate": 1.7672307732284143e-05, "loss": 1.3522, "step": 8971 }, { "epoch": 0.25, "learning_rate": 1.767174040488396e-05, "loss": 1.437, "step": 8972 }, { "epoch": 0.25, "learning_rate": 1.7671173017463685e-05, "loss": 1.3286, "step": 8973 }, { "epoch": 0.25, "learning_rate": 1.7670605570027763e-05, "loss": 1.5459, "step": 8974 }, { "epoch": 0.25, "learning_rate": 1.7670038062580626e-05, "loss": 1.3401, "step": 8975 }, { "epoch": 0.25, "learning_rate": 1.7669470495126718e-05, "loss": 1.3765, "step": 8976 }, { "epoch": 0.25, "learning_rate": 1.766890286767048e-05, "loss": 1.4753, "step": 8977 }, { "epoch": 0.25, "learning_rate": 1.7668335180216357e-05, "loss": 1.2998, "step": 8978 }, { "epoch": 0.25, "learning_rate": 1.7667767432768777e-05, "loss": 1.4751, "step": 8979 }, { "epoch": 0.25, "learning_rate": 1.7667199625332197e-05, "loss": 1.5015, "step": 8980 }, { "epoch": 0.25, "learning_rate": 1.7666631757911047e-05, "loss": 1.2925, "step": 8981 }, { "epoch": 0.25, "learning_rate": 1.766606383050978e-05, "loss": 1.283, "step": 8982 }, { "epoch": 0.25, "learning_rate": 1.766549584313283e-05, "loss": 1.3037, "step": 8983 }, { "epoch": 0.25, "learning_rate": 1.766492779578465e-05, "loss": 1.3521, "step": 8984 }, { "epoch": 0.25, "learning_rate": 1.7664359688469678e-05, "loss": 1.3369, "step": 8985 }, { "epoch": 0.25, "learning_rate": 1.7663791521192356e-05, "loss": 1.3335, "step": 8986 }, { "epoch": 0.25, "learning_rate": 1.7663223293957136e-05, "loss": 1.3567, "step": 8987 }, { "epoch": 0.25, "learning_rate": 1.766265500676846e-05, "loss": 1.4766, "step": 8988 }, { "epoch": 0.25, "learning_rate": 1.7662086659630777e-05, "loss": 1.3792, "step": 8989 }, { "epoch": 0.25, "learning_rate": 1.7661518252548527e-05, "loss": 1.3167, "step": 8990 }, { "epoch": 0.25, "learning_rate": 1.766094978552616e-05, "loss": 1.2704, "step": 8991 }, { "epoch": 0.25, "learning_rate": 1.766038125856813e-05, "loss": 1.333, "step": 8992 }, { "epoch": 0.25, "learning_rate": 1.7659812671678875e-05, "loss": 1.5081, "step": 8993 }, { "epoch": 0.25, "learning_rate": 1.765924402486285e-05, "loss": 1.313, "step": 8994 }, { "epoch": 0.25, "learning_rate": 1.76586753181245e-05, "loss": 1.3259, "step": 8995 }, { "epoch": 0.25, "learning_rate": 1.7658106551468277e-05, "loss": 1.3477, "step": 8996 }, { "epoch": 0.25, "learning_rate": 1.7657537724898626e-05, "loss": 1.3794, "step": 8997 }, { "epoch": 0.25, "learning_rate": 1.7656968838420004e-05, "loss": 1.8022, "step": 8998 }, { "epoch": 0.25, "learning_rate": 1.7656399892036854e-05, "loss": 1.3359, "step": 8999 }, { "epoch": 0.25, "learning_rate": 1.7655830885753635e-05, "loss": 1.2947, "step": 9000 }, { "epoch": 0.25, "learning_rate": 1.7655261819574796e-05, "loss": 1.189, "step": 9001 }, { "epoch": 0.25, "learning_rate": 1.765469269350479e-05, "loss": 1.4126, "step": 9002 }, { "epoch": 0.25, "learning_rate": 1.765412350754806e-05, "loss": 1.3721, "step": 9003 }, { "epoch": 0.25, "learning_rate": 1.7653554261709075e-05, "loss": 1.3411, "step": 9004 }, { "epoch": 0.25, "learning_rate": 1.7652984955992275e-05, "loss": 1.2703, "step": 9005 }, { "epoch": 0.25, "learning_rate": 1.7652415590402122e-05, "loss": 1.3669, "step": 9006 }, { "epoch": 0.25, "learning_rate": 1.765184616494307e-05, "loss": 1.2896, "step": 9007 }, { "epoch": 0.25, "learning_rate": 1.7651276679619568e-05, "loss": 1.5596, "step": 9008 }, { "epoch": 0.25, "learning_rate": 1.7650707134436075e-05, "loss": 1.2625, "step": 9009 }, { "epoch": 0.25, "learning_rate": 1.765013752939705e-05, "loss": 1.353, "step": 9010 }, { "epoch": 0.25, "learning_rate": 1.7649567864506943e-05, "loss": 1.2773, "step": 9011 }, { "epoch": 0.25, "learning_rate": 1.7648998139770216e-05, "loss": 1.2869, "step": 9012 }, { "epoch": 0.25, "learning_rate": 1.7648428355191325e-05, "loss": 1.4692, "step": 9013 }, { "epoch": 0.25, "learning_rate": 1.7647858510774724e-05, "loss": 1.4192, "step": 9014 }, { "epoch": 0.25, "learning_rate": 1.764728860652488e-05, "loss": 1.3831, "step": 9015 }, { "epoch": 0.25, "learning_rate": 1.7646718642446238e-05, "loss": 1.4751, "step": 9016 }, { "epoch": 0.25, "learning_rate": 1.764614861854327e-05, "loss": 1.3867, "step": 9017 }, { "epoch": 0.25, "learning_rate": 1.7645578534820434e-05, "loss": 1.2715, "step": 9018 }, { "epoch": 0.25, "learning_rate": 1.764500839128218e-05, "loss": 1.3206, "step": 9019 }, { "epoch": 0.25, "learning_rate": 1.764443818793298e-05, "loss": 1.332, "step": 9020 }, { "epoch": 0.25, "learning_rate": 1.7643867924777286e-05, "loss": 1.3083, "step": 9021 }, { "epoch": 0.25, "learning_rate": 1.7643297601819568e-05, "loss": 1.4185, "step": 9022 }, { "epoch": 0.25, "learning_rate": 1.7642727219064282e-05, "loss": 1.272, "step": 9023 }, { "epoch": 0.25, "learning_rate": 1.7642156776515894e-05, "loss": 1.3699, "step": 9024 }, { "epoch": 0.25, "learning_rate": 1.7641586274178862e-05, "loss": 1.3506, "step": 9025 }, { "epoch": 0.25, "learning_rate": 1.764101571205765e-05, "loss": 1.7627, "step": 9026 }, { "epoch": 0.25, "learning_rate": 1.764044509015673e-05, "loss": 1.4087, "step": 9027 }, { "epoch": 0.25, "learning_rate": 1.7639874408480557e-05, "loss": 1.1882, "step": 9028 }, { "epoch": 0.25, "learning_rate": 1.76393036670336e-05, "loss": 1.3025, "step": 9029 }, { "epoch": 0.25, "learning_rate": 1.7638732865820326e-05, "loss": 1.3447, "step": 9030 }, { "epoch": 0.25, "learning_rate": 1.7638162004845194e-05, "loss": 1.3999, "step": 9031 }, { "epoch": 0.25, "learning_rate": 1.7637591084112676e-05, "loss": 1.3606, "step": 9032 }, { "epoch": 0.25, "learning_rate": 1.7637020103627236e-05, "loss": 1.2217, "step": 9033 }, { "epoch": 0.25, "learning_rate": 1.7636449063393342e-05, "loss": 1.314, "step": 9034 }, { "epoch": 0.25, "learning_rate": 1.7635877963415463e-05, "loss": 1.4775, "step": 9035 }, { "epoch": 0.25, "learning_rate": 1.763530680369806e-05, "loss": 1.2799, "step": 9036 }, { "epoch": 0.25, "learning_rate": 1.7634735584245615e-05, "loss": 1.3433, "step": 9037 }, { "epoch": 0.25, "learning_rate": 1.7634164305062585e-05, "loss": 1.3247, "step": 9038 }, { "epoch": 0.25, "learning_rate": 1.7633592966153442e-05, "loss": 1.4397, "step": 9039 }, { "epoch": 0.25, "learning_rate": 1.763302156752266e-05, "loss": 1.3269, "step": 9040 }, { "epoch": 0.25, "learning_rate": 1.7632450109174704e-05, "loss": 1.3159, "step": 9041 }, { "epoch": 0.25, "learning_rate": 1.7631878591114048e-05, "loss": 1.2773, "step": 9042 }, { "epoch": 0.25, "learning_rate": 1.7631307013345164e-05, "loss": 1.2656, "step": 9043 }, { "epoch": 0.25, "learning_rate": 1.763073537587252e-05, "loss": 1.3271, "step": 9044 }, { "epoch": 0.25, "learning_rate": 1.7630163678700594e-05, "loss": 1.4421, "step": 9045 }, { "epoch": 0.25, "learning_rate": 1.7629591921833854e-05, "loss": 1.3496, "step": 9046 }, { "epoch": 0.25, "learning_rate": 1.7629020105276774e-05, "loss": 1.3594, "step": 9047 }, { "epoch": 0.25, "learning_rate": 1.7628448229033826e-05, "loss": 1.2251, "step": 9048 }, { "epoch": 0.25, "learning_rate": 1.7627876293109492e-05, "loss": 1.3022, "step": 9049 }, { "epoch": 0.25, "learning_rate": 1.7627304297508235e-05, "loss": 1.4141, "step": 9050 }, { "epoch": 0.25, "learning_rate": 1.762673224223454e-05, "loss": 1.2837, "step": 9051 }, { "epoch": 0.25, "learning_rate": 1.7626160127292875e-05, "loss": 1.4373, "step": 9052 }, { "epoch": 0.25, "learning_rate": 1.762558795268772e-05, "loss": 1.5312, "step": 9053 }, { "epoch": 0.25, "learning_rate": 1.762501571842355e-05, "loss": 1.3206, "step": 9054 }, { "epoch": 0.25, "learning_rate": 1.7624443424504844e-05, "loss": 1.3599, "step": 9055 }, { "epoch": 0.25, "learning_rate": 1.762387107093608e-05, "loss": 1.4495, "step": 9056 }, { "epoch": 0.25, "learning_rate": 1.762329865772173e-05, "loss": 1.1543, "step": 9057 }, { "epoch": 0.25, "learning_rate": 1.7622726184866277e-05, "loss": 1.2744, "step": 9058 }, { "epoch": 0.25, "learning_rate": 1.76221536523742e-05, "loss": 1.4727, "step": 9059 }, { "epoch": 0.25, "learning_rate": 1.7621581060249974e-05, "loss": 1.4634, "step": 9060 }, { "epoch": 0.25, "learning_rate": 1.7621008408498083e-05, "loss": 1.2952, "step": 9061 }, { "epoch": 0.25, "learning_rate": 1.7620435697123007e-05, "loss": 1.3945, "step": 9062 }, { "epoch": 0.25, "learning_rate": 1.7619862926129226e-05, "loss": 1.4429, "step": 9063 }, { "epoch": 0.25, "learning_rate": 1.761929009552122e-05, "loss": 1.4614, "step": 9064 }, { "epoch": 0.25, "learning_rate": 1.7618717205303474e-05, "loss": 1.3914, "step": 9065 }, { "epoch": 0.25, "learning_rate": 1.7618144255480462e-05, "loss": 1.4485, "step": 9066 }, { "epoch": 0.25, "learning_rate": 1.7617571246056674e-05, "loss": 1.4026, "step": 9067 }, { "epoch": 0.25, "learning_rate": 1.761699817703659e-05, "loss": 1.4009, "step": 9068 }, { "epoch": 0.25, "learning_rate": 1.7616425048424695e-05, "loss": 1.3765, "step": 9069 }, { "epoch": 0.25, "learning_rate": 1.761585186022547e-05, "loss": 1.2659, "step": 9070 }, { "epoch": 0.25, "learning_rate": 1.7615278612443402e-05, "loss": 1.4087, "step": 9071 }, { "epoch": 0.25, "learning_rate": 1.7614705305082975e-05, "loss": 1.4048, "step": 9072 }, { "epoch": 0.25, "learning_rate": 1.7614131938148674e-05, "loss": 1.356, "step": 9073 }, { "epoch": 0.25, "learning_rate": 1.761355851164499e-05, "loss": 1.332, "step": 9074 }, { "epoch": 0.25, "learning_rate": 1.7612985025576398e-05, "loss": 1.3811, "step": 9075 }, { "epoch": 0.25, "learning_rate": 1.7612411479947392e-05, "loss": 1.3816, "step": 9076 }, { "epoch": 0.25, "learning_rate": 1.7611837874762462e-05, "loss": 1.3745, "step": 9077 }, { "epoch": 0.25, "learning_rate": 1.761126421002609e-05, "loss": 1.4929, "step": 9078 }, { "epoch": 0.25, "learning_rate": 1.7610690485742763e-05, "loss": 1.4827, "step": 9079 }, { "epoch": 0.25, "learning_rate": 1.7610116701916976e-05, "loss": 1.3784, "step": 9080 }, { "epoch": 0.25, "learning_rate": 1.760954285855321e-05, "loss": 1.3667, "step": 9081 }, { "epoch": 0.25, "learning_rate": 1.7608968955655967e-05, "loss": 1.5117, "step": 9082 }, { "epoch": 0.25, "learning_rate": 1.7608394993229722e-05, "loss": 1.3953, "step": 9083 }, { "epoch": 0.25, "learning_rate": 1.7607820971278978e-05, "loss": 1.4595, "step": 9084 }, { "epoch": 0.25, "learning_rate": 1.7607246889808215e-05, "loss": 1.4321, "step": 9085 }, { "epoch": 0.25, "learning_rate": 1.760667274882193e-05, "loss": 1.2822, "step": 9086 }, { "epoch": 0.25, "learning_rate": 1.7606098548324615e-05, "loss": 1.3215, "step": 9087 }, { "epoch": 0.25, "learning_rate": 1.7605524288320764e-05, "loss": 1.394, "step": 9088 }, { "epoch": 0.25, "learning_rate": 1.7604949968814864e-05, "loss": 1.5132, "step": 9089 }, { "epoch": 0.25, "learning_rate": 1.760437558981141e-05, "loss": 1.3477, "step": 9090 }, { "epoch": 0.25, "learning_rate": 1.7603801151314903e-05, "loss": 1.2207, "step": 9091 }, { "epoch": 0.25, "learning_rate": 1.7603226653329826e-05, "loss": 1.2783, "step": 9092 }, { "epoch": 0.25, "learning_rate": 1.7602652095860682e-05, "loss": 1.4033, "step": 9093 }, { "epoch": 0.25, "learning_rate": 1.7602077478911967e-05, "loss": 1.1851, "step": 9094 }, { "epoch": 0.25, "learning_rate": 1.7601502802488165e-05, "loss": 1.4302, "step": 9095 }, { "epoch": 0.25, "learning_rate": 1.7600928066593784e-05, "loss": 1.2856, "step": 9096 }, { "epoch": 0.25, "learning_rate": 1.7600353271233316e-05, "loss": 1.291, "step": 9097 }, { "epoch": 0.25, "learning_rate": 1.7599778416411257e-05, "loss": 1.3411, "step": 9098 }, { "epoch": 0.25, "learning_rate": 1.7599203502132103e-05, "loss": 1.3685, "step": 9099 }, { "epoch": 0.25, "learning_rate": 1.7598628528400353e-05, "loss": 1.4136, "step": 9100 }, { "epoch": 0.25, "learning_rate": 1.759805349522051e-05, "loss": 1.3667, "step": 9101 }, { "epoch": 0.25, "learning_rate": 1.759747840259707e-05, "loss": 1.436, "step": 9102 }, { "epoch": 0.25, "learning_rate": 1.759690325053453e-05, "loss": 1.3564, "step": 9103 }, { "epoch": 0.25, "learning_rate": 1.759632803903739e-05, "loss": 1.3877, "step": 9104 }, { "epoch": 0.25, "learning_rate": 1.7595752768110155e-05, "loss": 1.3872, "step": 9105 }, { "epoch": 0.25, "learning_rate": 1.759517743775732e-05, "loss": 1.2993, "step": 9106 }, { "epoch": 0.25, "learning_rate": 1.7594602047983388e-05, "loss": 1.334, "step": 9107 }, { "epoch": 0.25, "learning_rate": 1.759402659879286e-05, "loss": 1.3796, "step": 9108 }, { "epoch": 0.25, "learning_rate": 1.7593451090190245e-05, "loss": 1.3735, "step": 9109 }, { "epoch": 0.25, "learning_rate": 1.759287552218003e-05, "loss": 1.5095, "step": 9110 }, { "epoch": 0.25, "learning_rate": 1.7592299894766735e-05, "loss": 1.2622, "step": 9111 }, { "epoch": 0.25, "learning_rate": 1.759172420795485e-05, "loss": 1.3579, "step": 9112 }, { "epoch": 0.25, "learning_rate": 1.7591148461748888e-05, "loss": 1.4209, "step": 9113 }, { "epoch": 0.25, "learning_rate": 1.759057265615335e-05, "loss": 1.3435, "step": 9114 }, { "epoch": 0.25, "learning_rate": 1.758999679117274e-05, "loss": 1.2529, "step": 9115 }, { "epoch": 0.25, "learning_rate": 1.7589420866811562e-05, "loss": 1.3682, "step": 9116 }, { "epoch": 0.25, "learning_rate": 1.758884488307433e-05, "loss": 1.2952, "step": 9117 }, { "epoch": 0.25, "learning_rate": 1.758826883996554e-05, "loss": 1.3101, "step": 9118 }, { "epoch": 0.25, "learning_rate": 1.7587692737489702e-05, "loss": 1.3945, "step": 9119 }, { "epoch": 0.25, "learning_rate": 1.7587116575651326e-05, "loss": 1.499, "step": 9120 }, { "epoch": 0.25, "learning_rate": 1.7586540354454917e-05, "loss": 1.4226, "step": 9121 }, { "epoch": 0.25, "learning_rate": 1.7585964073904982e-05, "loss": 1.3445, "step": 9122 }, { "epoch": 0.25, "learning_rate": 1.7585387734006033e-05, "loss": 1.3335, "step": 9123 }, { "epoch": 0.25, "learning_rate": 1.758481133476258e-05, "loss": 1.3386, "step": 9124 }, { "epoch": 0.25, "learning_rate": 1.7584234876179124e-05, "loss": 1.3054, "step": 9125 }, { "epoch": 0.25, "learning_rate": 1.7583658358260185e-05, "loss": 1.3311, "step": 9126 }, { "epoch": 0.25, "learning_rate": 1.758308178101027e-05, "loss": 1.3328, "step": 9127 }, { "epoch": 0.25, "learning_rate": 1.7582505144433883e-05, "loss": 1.2844, "step": 9128 }, { "epoch": 0.25, "learning_rate": 1.7581928448535545e-05, "loss": 1.2312, "step": 9129 }, { "epoch": 0.25, "learning_rate": 1.7581351693319764e-05, "loss": 1.3381, "step": 9130 }, { "epoch": 0.25, "learning_rate": 1.7580774878791053e-05, "loss": 1.4695, "step": 9131 }, { "epoch": 0.25, "learning_rate": 1.7580198004953922e-05, "loss": 1.4717, "step": 9132 }, { "epoch": 0.25, "learning_rate": 1.7579621071812887e-05, "loss": 1.2737, "step": 9133 }, { "epoch": 0.25, "learning_rate": 1.7579044079372465e-05, "loss": 1.5605, "step": 9134 }, { "epoch": 0.25, "learning_rate": 1.757846702763716e-05, "loss": 1.3708, "step": 9135 }, { "epoch": 0.25, "learning_rate": 1.75778899166115e-05, "loss": 1.324, "step": 9136 }, { "epoch": 0.25, "learning_rate": 1.7577312746299986e-05, "loss": 1.2502, "step": 9137 }, { "epoch": 0.25, "learning_rate": 1.7576735516707143e-05, "loss": 1.4282, "step": 9138 }, { "epoch": 0.25, "learning_rate": 1.757615822783748e-05, "loss": 1.3418, "step": 9139 }, { "epoch": 0.25, "learning_rate": 1.7575580879695524e-05, "loss": 1.3367, "step": 9140 }, { "epoch": 0.25, "learning_rate": 1.7575003472285783e-05, "loss": 1.2971, "step": 9141 }, { "epoch": 0.25, "learning_rate": 1.7574426005612776e-05, "loss": 1.5005, "step": 9142 }, { "epoch": 0.25, "learning_rate": 1.757384847968102e-05, "loss": 1.178, "step": 9143 }, { "epoch": 0.25, "learning_rate": 1.757327089449504e-05, "loss": 1.5542, "step": 9144 }, { "epoch": 0.25, "learning_rate": 1.7572693250059345e-05, "loss": 1.2998, "step": 9145 }, { "epoch": 0.25, "learning_rate": 1.7572115546378462e-05, "loss": 1.3892, "step": 9146 }, { "epoch": 0.25, "learning_rate": 1.7571537783456905e-05, "loss": 1.4014, "step": 9147 }, { "epoch": 0.25, "learning_rate": 1.7570959961299196e-05, "loss": 1.3528, "step": 9148 }, { "epoch": 0.25, "learning_rate": 1.757038207990986e-05, "loss": 1.4053, "step": 9149 }, { "epoch": 0.25, "learning_rate": 1.7569804139293413e-05, "loss": 1.3149, "step": 9150 }, { "epoch": 0.25, "learning_rate": 1.756922613945438e-05, "loss": 1.3311, "step": 9151 }, { "epoch": 0.25, "learning_rate": 1.756864808039728e-05, "loss": 1.3911, "step": 9152 }, { "epoch": 0.25, "learning_rate": 1.7568069962126633e-05, "loss": 1.4409, "step": 9153 }, { "epoch": 0.25, "learning_rate": 1.7567491784646968e-05, "loss": 1.4539, "step": 9154 }, { "epoch": 0.25, "learning_rate": 1.7566913547962807e-05, "loss": 1.4009, "step": 9155 }, { "epoch": 0.25, "learning_rate": 1.756633525207867e-05, "loss": 1.4077, "step": 9156 }, { "epoch": 0.25, "learning_rate": 1.7565756896999082e-05, "loss": 1.3823, "step": 9157 }, { "epoch": 0.25, "learning_rate": 1.756517848272857e-05, "loss": 1.2744, "step": 9158 }, { "epoch": 0.25, "learning_rate": 1.7564600009271668e-05, "loss": 1.4775, "step": 9159 }, { "epoch": 0.25, "learning_rate": 1.7564021476632884e-05, "loss": 1.3152, "step": 9160 }, { "epoch": 0.25, "learning_rate": 1.7563442884816756e-05, "loss": 1.4253, "step": 9161 }, { "epoch": 0.25, "learning_rate": 1.7562864233827805e-05, "loss": 1.4216, "step": 9162 }, { "epoch": 0.25, "learning_rate": 1.7562285523670563e-05, "loss": 1.2783, "step": 9163 }, { "epoch": 0.25, "learning_rate": 1.7561706754349553e-05, "loss": 1.3767, "step": 9164 }, { "epoch": 0.25, "learning_rate": 1.7561127925869306e-05, "loss": 1.3579, "step": 9165 }, { "epoch": 0.25, "learning_rate": 1.7560549038234352e-05, "loss": 1.3047, "step": 9166 }, { "epoch": 0.25, "learning_rate": 1.7559970091449213e-05, "loss": 1.3171, "step": 9167 }, { "epoch": 0.25, "learning_rate": 1.7559391085518424e-05, "loss": 1.4568, "step": 9168 }, { "epoch": 0.25, "learning_rate": 1.7558812020446516e-05, "loss": 1.1799, "step": 9169 }, { "epoch": 0.25, "learning_rate": 1.7558232896238018e-05, "loss": 1.2861, "step": 9170 }, { "epoch": 0.25, "learning_rate": 1.7557653712897458e-05, "loss": 1.425, "step": 9171 }, { "epoch": 0.25, "learning_rate": 1.755707447042937e-05, "loss": 1.3083, "step": 9172 }, { "epoch": 0.25, "learning_rate": 1.7556495168838285e-05, "loss": 1.3899, "step": 9173 }, { "epoch": 0.25, "learning_rate": 1.7555915808128734e-05, "loss": 1.2397, "step": 9174 }, { "epoch": 0.25, "learning_rate": 1.755533638830525e-05, "loss": 1.3586, "step": 9175 }, { "epoch": 0.25, "learning_rate": 1.755475690937237e-05, "loss": 1.5508, "step": 9176 }, { "epoch": 0.25, "learning_rate": 1.755417737133462e-05, "loss": 1.4355, "step": 9177 }, { "epoch": 0.25, "learning_rate": 1.755359777419654e-05, "loss": 1.541, "step": 9178 }, { "epoch": 0.25, "learning_rate": 1.7553018117962666e-05, "loss": 1.5056, "step": 9179 }, { "epoch": 0.25, "learning_rate": 1.7552438402637527e-05, "loss": 1.3442, "step": 9180 }, { "epoch": 0.25, "learning_rate": 1.7551858628225664e-05, "loss": 1.3105, "step": 9181 }, { "epoch": 0.25, "learning_rate": 1.7551278794731606e-05, "loss": 1.3025, "step": 9182 }, { "epoch": 0.25, "learning_rate": 1.7550698902159897e-05, "loss": 1.3975, "step": 9183 }, { "epoch": 0.25, "learning_rate": 1.755011895051507e-05, "loss": 1.2856, "step": 9184 }, { "epoch": 0.25, "learning_rate": 1.7549538939801662e-05, "loss": 1.2678, "step": 9185 }, { "epoch": 0.25, "learning_rate": 1.7548958870024213e-05, "loss": 1.3555, "step": 9186 }, { "epoch": 0.25, "learning_rate": 1.754837874118726e-05, "loss": 1.3359, "step": 9187 }, { "epoch": 0.25, "learning_rate": 1.7547798553295338e-05, "loss": 1.4316, "step": 9188 }, { "epoch": 0.25, "learning_rate": 1.754721830635299e-05, "loss": 1.3247, "step": 9189 }, { "epoch": 0.25, "learning_rate": 1.7546638000364752e-05, "loss": 1.3076, "step": 9190 }, { "epoch": 0.25, "learning_rate": 1.7546057635335172e-05, "loss": 1.3967, "step": 9191 }, { "epoch": 0.25, "learning_rate": 1.7545477211268784e-05, "loss": 1.0857, "step": 9192 }, { "epoch": 0.25, "learning_rate": 1.7544896728170133e-05, "loss": 1.4775, "step": 9193 }, { "epoch": 0.25, "learning_rate": 1.7544316186043754e-05, "loss": 1.3677, "step": 9194 }, { "epoch": 0.25, "learning_rate": 1.7543735584894195e-05, "loss": 1.3372, "step": 9195 }, { "epoch": 0.25, "learning_rate": 1.7543154924725993e-05, "loss": 1.2317, "step": 9196 }, { "epoch": 0.25, "learning_rate": 1.7542574205543698e-05, "loss": 1.4556, "step": 9197 }, { "epoch": 0.25, "learning_rate": 1.7541993427351846e-05, "loss": 1.3682, "step": 9198 }, { "epoch": 0.25, "learning_rate": 1.7541412590154987e-05, "loss": 1.302, "step": 9199 }, { "epoch": 0.25, "learning_rate": 1.754083169395766e-05, "loss": 1.4043, "step": 9200 }, { "epoch": 0.25, "learning_rate": 1.7540250738764412e-05, "loss": 1.3521, "step": 9201 }, { "epoch": 0.25, "learning_rate": 1.7539669724579785e-05, "loss": 1.4092, "step": 9202 }, { "epoch": 0.25, "learning_rate": 1.7539088651408333e-05, "loss": 1.3577, "step": 9203 }, { "epoch": 0.25, "learning_rate": 1.7538507519254592e-05, "loss": 1.1619, "step": 9204 }, { "epoch": 0.25, "learning_rate": 1.7537926328123116e-05, "loss": 1.3777, "step": 9205 }, { "epoch": 0.25, "learning_rate": 1.753734507801845e-05, "loss": 1.2529, "step": 9206 }, { "epoch": 0.25, "learning_rate": 1.7536763768945136e-05, "loss": 1.2339, "step": 9207 }, { "epoch": 0.25, "learning_rate": 1.753618240090773e-05, "loss": 1.177, "step": 9208 }, { "epoch": 0.25, "learning_rate": 1.7535600973910773e-05, "loss": 1.4207, "step": 9209 }, { "epoch": 0.25, "learning_rate": 1.753501948795882e-05, "loss": 1.4912, "step": 9210 }, { "epoch": 0.25, "learning_rate": 1.7534437943056418e-05, "loss": 1.4299, "step": 9211 }, { "epoch": 0.25, "learning_rate": 1.7533856339208118e-05, "loss": 1.2412, "step": 9212 }, { "epoch": 0.25, "learning_rate": 1.7533274676418464e-05, "loss": 1.3528, "step": 9213 }, { "epoch": 0.25, "learning_rate": 1.7532692954692018e-05, "loss": 1.3467, "step": 9214 }, { "epoch": 0.25, "learning_rate": 1.753211117403332e-05, "loss": 1.4814, "step": 9215 }, { "epoch": 0.25, "learning_rate": 1.7531529334446923e-05, "loss": 1.3826, "step": 9216 }, { "epoch": 0.25, "learning_rate": 1.7530947435937385e-05, "loss": 1.4124, "step": 9217 }, { "epoch": 0.25, "learning_rate": 1.7530365478509256e-05, "loss": 1.3647, "step": 9218 }, { "epoch": 0.25, "learning_rate": 1.7529783462167088e-05, "loss": 1.4932, "step": 9219 }, { "epoch": 0.25, "learning_rate": 1.752920138691544e-05, "loss": 1.3064, "step": 9220 }, { "epoch": 0.25, "learning_rate": 1.7528619252758855e-05, "loss": 1.3782, "step": 9221 }, { "epoch": 0.25, "learning_rate": 1.752803705970189e-05, "loss": 1.3989, "step": 9222 }, { "epoch": 0.25, "learning_rate": 1.7527454807749113e-05, "loss": 1.271, "step": 9223 }, { "epoch": 0.25, "learning_rate": 1.752687249690506e-05, "loss": 1.2417, "step": 9224 }, { "epoch": 0.25, "learning_rate": 1.75262901271743e-05, "loss": 1.4233, "step": 9225 }, { "epoch": 0.25, "learning_rate": 1.7525707698561383e-05, "loss": 1.3853, "step": 9226 }, { "epoch": 0.25, "learning_rate": 1.7525125211070874e-05, "loss": 1.2571, "step": 9227 }, { "epoch": 0.25, "learning_rate": 1.752454266470732e-05, "loss": 1.3425, "step": 9228 }, { "epoch": 0.25, "learning_rate": 1.752396005947528e-05, "loss": 1.3499, "step": 9229 }, { "epoch": 0.25, "learning_rate": 1.7523377395379316e-05, "loss": 1.3464, "step": 9230 }, { "epoch": 0.25, "learning_rate": 1.7522794672423988e-05, "loss": 1.3862, "step": 9231 }, { "epoch": 0.25, "learning_rate": 1.752221189061385e-05, "loss": 1.354, "step": 9232 }, { "epoch": 0.25, "learning_rate": 1.752162904995346e-05, "loss": 1.3596, "step": 9233 }, { "epoch": 0.25, "learning_rate": 1.7521046150447386e-05, "loss": 1.3372, "step": 9234 }, { "epoch": 0.25, "learning_rate": 1.7520463192100183e-05, "loss": 1.3796, "step": 9235 }, { "epoch": 0.25, "learning_rate": 1.751988017491641e-05, "loss": 1.3254, "step": 9236 }, { "epoch": 0.25, "learning_rate": 1.7519297098900633e-05, "loss": 1.2288, "step": 9237 }, { "epoch": 0.25, "learning_rate": 1.7518713964057408e-05, "loss": 1.283, "step": 9238 }, { "epoch": 0.25, "learning_rate": 1.7518130770391302e-05, "loss": 1.3752, "step": 9239 }, { "epoch": 0.25, "learning_rate": 1.7517547517906876e-05, "loss": 1.4902, "step": 9240 }, { "epoch": 0.25, "learning_rate": 1.7516964206608697e-05, "loss": 1.3562, "step": 9241 }, { "epoch": 0.25, "learning_rate": 1.751638083650132e-05, "loss": 1.3408, "step": 9242 }, { "epoch": 0.25, "learning_rate": 1.7515797407589318e-05, "loss": 1.2058, "step": 9243 }, { "epoch": 0.25, "learning_rate": 1.7515213919877246e-05, "loss": 1.4326, "step": 9244 }, { "epoch": 0.25, "learning_rate": 1.7514630373369676e-05, "loss": 1.7568, "step": 9245 }, { "epoch": 0.25, "learning_rate": 1.7514046768071175e-05, "loss": 1.436, "step": 9246 }, { "epoch": 0.25, "learning_rate": 1.75134631039863e-05, "loss": 1.4785, "step": 9247 }, { "epoch": 0.25, "learning_rate": 1.7512879381119624e-05, "loss": 1.3591, "step": 9248 }, { "epoch": 0.25, "learning_rate": 1.7512295599475718e-05, "loss": 1.439, "step": 9249 }, { "epoch": 0.25, "learning_rate": 1.7511711759059137e-05, "loss": 1.356, "step": 9250 }, { "epoch": 0.25, "learning_rate": 1.751112785987446e-05, "loss": 1.4243, "step": 9251 }, { "epoch": 0.25, "learning_rate": 1.7510543901926248e-05, "loss": 1.2935, "step": 9252 }, { "epoch": 0.25, "learning_rate": 1.7509959885219074e-05, "loss": 1.3704, "step": 9253 }, { "epoch": 0.25, "learning_rate": 1.7509375809757504e-05, "loss": 1.4648, "step": 9254 }, { "epoch": 0.25, "learning_rate": 1.7508791675546112e-05, "loss": 1.4751, "step": 9255 }, { "epoch": 0.25, "learning_rate": 1.750820748258946e-05, "loss": 1.4026, "step": 9256 }, { "epoch": 0.25, "learning_rate": 1.7507623230892126e-05, "loss": 1.4468, "step": 9257 }, { "epoch": 0.25, "learning_rate": 1.7507038920458677e-05, "loss": 1.3979, "step": 9258 }, { "epoch": 0.25, "learning_rate": 1.7506454551293684e-05, "loss": 1.2852, "step": 9259 }, { "epoch": 0.25, "learning_rate": 1.7505870123401725e-05, "loss": 1.3333, "step": 9260 }, { "epoch": 0.25, "learning_rate": 1.7505285636787364e-05, "loss": 1.3372, "step": 9261 }, { "epoch": 0.25, "learning_rate": 1.750470109145518e-05, "loss": 1.4177, "step": 9262 }, { "epoch": 0.25, "learning_rate": 1.7504116487409742e-05, "loss": 1.3086, "step": 9263 }, { "epoch": 0.25, "learning_rate": 1.7503531824655625e-05, "loss": 1.5181, "step": 9264 }, { "epoch": 0.25, "learning_rate": 1.7502947103197402e-05, "loss": 1.5386, "step": 9265 }, { "epoch": 0.25, "learning_rate": 1.7502362323039653e-05, "loss": 1.175, "step": 9266 }, { "epoch": 0.25, "learning_rate": 1.7501777484186946e-05, "loss": 1.4004, "step": 9267 }, { "epoch": 0.25, "learning_rate": 1.750119258664386e-05, "loss": 1.342, "step": 9268 }, { "epoch": 0.25, "learning_rate": 1.7500607630414973e-05, "loss": 1.7705, "step": 9269 }, { "epoch": 0.25, "learning_rate": 1.750002261550486e-05, "loss": 1.4167, "step": 9270 }, { "epoch": 0.25, "learning_rate": 1.7499437541918088e-05, "loss": 1.2056, "step": 9271 }, { "epoch": 0.25, "learning_rate": 1.749885240965925e-05, "loss": 1.3384, "step": 9272 }, { "epoch": 0.25, "learning_rate": 1.7498267218732917e-05, "loss": 1.4595, "step": 9273 }, { "epoch": 0.25, "learning_rate": 1.7497681969143665e-05, "loss": 1.4419, "step": 9274 }, { "epoch": 0.25, "learning_rate": 1.7497096660896076e-05, "loss": 1.3198, "step": 9275 }, { "epoch": 0.25, "learning_rate": 1.7496511293994725e-05, "loss": 1.3044, "step": 9276 }, { "epoch": 0.25, "learning_rate": 1.74959258684442e-05, "loss": 1.2842, "step": 9277 }, { "epoch": 0.25, "learning_rate": 1.7495340384249074e-05, "loss": 1.3042, "step": 9278 }, { "epoch": 0.25, "learning_rate": 1.749475484141393e-05, "loss": 1.3562, "step": 9279 }, { "epoch": 0.25, "learning_rate": 1.7494169239943347e-05, "loss": 1.2344, "step": 9280 }, { "epoch": 0.25, "learning_rate": 1.7493583579841908e-05, "loss": 1.3235, "step": 9281 }, { "epoch": 0.25, "learning_rate": 1.7492997861114194e-05, "loss": 1.4585, "step": 9282 }, { "epoch": 0.25, "learning_rate": 1.749241208376479e-05, "loss": 1.1343, "step": 9283 }, { "epoch": 0.25, "learning_rate": 1.7491826247798278e-05, "loss": 1.4771, "step": 9284 }, { "epoch": 0.25, "learning_rate": 1.749124035321924e-05, "loss": 1.2532, "step": 9285 }, { "epoch": 0.25, "learning_rate": 1.7490654400032257e-05, "loss": 1.4595, "step": 9286 }, { "epoch": 0.25, "learning_rate": 1.7490068388241915e-05, "loss": 1.3, "step": 9287 }, { "epoch": 0.25, "learning_rate": 1.7489482317852803e-05, "loss": 1.4507, "step": 9288 }, { "epoch": 0.25, "learning_rate": 1.7488896188869503e-05, "loss": 1.5093, "step": 9289 }, { "epoch": 0.25, "learning_rate": 1.7488310001296605e-05, "loss": 1.5088, "step": 9290 }, { "epoch": 0.25, "learning_rate": 1.7487723755138687e-05, "loss": 1.3274, "step": 9291 }, { "epoch": 0.25, "learning_rate": 1.748713745040034e-05, "loss": 1.2747, "step": 9292 }, { "epoch": 0.25, "learning_rate": 1.7486551087086146e-05, "loss": 1.3948, "step": 9293 }, { "epoch": 0.25, "learning_rate": 1.7485964665200703e-05, "loss": 1.3708, "step": 9294 }, { "epoch": 0.25, "learning_rate": 1.748537818474859e-05, "loss": 1.4048, "step": 9295 }, { "epoch": 0.25, "learning_rate": 1.7484791645734396e-05, "loss": 1.3057, "step": 9296 }, { "epoch": 0.25, "learning_rate": 1.7484205048162715e-05, "loss": 1.4021, "step": 9297 }, { "epoch": 0.25, "learning_rate": 1.748361839203813e-05, "loss": 1.2686, "step": 9298 }, { "epoch": 0.25, "learning_rate": 1.7483031677365234e-05, "loss": 1.2803, "step": 9299 }, { "epoch": 0.25, "learning_rate": 1.748244490414862e-05, "loss": 1.4065, "step": 9300 }, { "epoch": 0.25, "learning_rate": 1.7481858072392875e-05, "loss": 1.2886, "step": 9301 }, { "epoch": 0.25, "learning_rate": 1.748127118210259e-05, "loss": 1.4514, "step": 9302 }, { "epoch": 0.25, "learning_rate": 1.7480684233282353e-05, "loss": 1.2693, "step": 9303 }, { "epoch": 0.25, "learning_rate": 1.7480097225936766e-05, "loss": 1.199, "step": 9304 }, { "epoch": 0.25, "learning_rate": 1.747951016007041e-05, "loss": 1.3994, "step": 9305 }, { "epoch": 0.25, "learning_rate": 1.7478923035687893e-05, "loss": 1.356, "step": 9306 }, { "epoch": 0.25, "learning_rate": 1.747833585279379e-05, "loss": 1.2917, "step": 9307 }, { "epoch": 0.25, "learning_rate": 1.7477748611392706e-05, "loss": 1.4167, "step": 9308 }, { "epoch": 0.25, "learning_rate": 1.7477161311489234e-05, "loss": 1.4058, "step": 9309 }, { "epoch": 0.25, "learning_rate": 1.7476573953087968e-05, "loss": 1.3928, "step": 9310 }, { "epoch": 0.25, "learning_rate": 1.7475986536193504e-05, "loss": 1.3105, "step": 9311 }, { "epoch": 0.25, "learning_rate": 1.7475399060810436e-05, "loss": 1.1931, "step": 9312 }, { "epoch": 0.25, "learning_rate": 1.747481152694336e-05, "loss": 1.1204, "step": 9313 }, { "epoch": 0.25, "learning_rate": 1.7474223934596875e-05, "loss": 1.2717, "step": 9314 }, { "epoch": 0.25, "learning_rate": 1.7473636283775577e-05, "loss": 1.2468, "step": 9315 }, { "epoch": 0.25, "learning_rate": 1.747304857448406e-05, "loss": 1.2646, "step": 9316 }, { "epoch": 0.25, "learning_rate": 1.7472460806726928e-05, "loss": 1.4885, "step": 9317 }, { "epoch": 0.25, "learning_rate": 1.7471872980508776e-05, "loss": 1.4707, "step": 9318 }, { "epoch": 0.25, "learning_rate": 1.7471285095834204e-05, "loss": 1.4985, "step": 9319 }, { "epoch": 0.25, "learning_rate": 1.7470697152707806e-05, "loss": 1.7319, "step": 9320 }, { "epoch": 0.25, "learning_rate": 1.7470109151134193e-05, "loss": 1.3398, "step": 9321 }, { "epoch": 0.25, "learning_rate": 1.7469521091117957e-05, "loss": 1.3916, "step": 9322 }, { "epoch": 0.25, "learning_rate": 1.7468932972663697e-05, "loss": 1.3647, "step": 9323 }, { "epoch": 0.25, "learning_rate": 1.746834479577602e-05, "loss": 1.4229, "step": 9324 }, { "epoch": 0.25, "learning_rate": 1.7467756560459525e-05, "loss": 1.4058, "step": 9325 }, { "epoch": 0.25, "learning_rate": 1.7467168266718813e-05, "loss": 1.7461, "step": 9326 }, { "epoch": 0.25, "learning_rate": 1.7466579914558487e-05, "loss": 1.5337, "step": 9327 }, { "epoch": 0.25, "learning_rate": 1.7465991503983154e-05, "loss": 1.4106, "step": 9328 }, { "epoch": 0.25, "learning_rate": 1.7465403034997415e-05, "loss": 1.4189, "step": 9329 }, { "epoch": 0.25, "learning_rate": 1.746481450760587e-05, "loss": 1.501, "step": 9330 }, { "epoch": 0.25, "learning_rate": 1.7464225921813125e-05, "loss": 1.2207, "step": 9331 }, { "epoch": 0.25, "learning_rate": 1.746363727762379e-05, "loss": 1.3623, "step": 9332 }, { "epoch": 0.25, "learning_rate": 1.7463048575042465e-05, "loss": 1.3435, "step": 9333 }, { "epoch": 0.25, "learning_rate": 1.746245981407376e-05, "loss": 1.2844, "step": 9334 }, { "epoch": 0.25, "learning_rate": 1.7461870994722274e-05, "loss": 1.3926, "step": 9335 }, { "epoch": 0.25, "learning_rate": 1.746128211699262e-05, "loss": 1.3208, "step": 9336 }, { "epoch": 0.25, "learning_rate": 1.7460693180889406e-05, "loss": 1.4292, "step": 9337 }, { "epoch": 0.26, "learning_rate": 1.7460104186417234e-05, "loss": 1.4756, "step": 9338 }, { "epoch": 0.26, "learning_rate": 1.7459515133580713e-05, "loss": 1.3196, "step": 9339 }, { "epoch": 0.26, "learning_rate": 1.7458926022384456e-05, "loss": 1.3984, "step": 9340 }, { "epoch": 0.26, "learning_rate": 1.745833685283307e-05, "loss": 1.3567, "step": 9341 }, { "epoch": 0.26, "learning_rate": 1.7457747624931163e-05, "loss": 1.3123, "step": 9342 }, { "epoch": 0.26, "learning_rate": 1.7457158338683344e-05, "loss": 1.4482, "step": 9343 }, { "epoch": 0.26, "learning_rate": 1.7456568994094225e-05, "loss": 1.3171, "step": 9344 }, { "epoch": 0.26, "learning_rate": 1.7455979591168417e-05, "loss": 1.3152, "step": 9345 }, { "epoch": 0.26, "learning_rate": 1.7455390129910532e-05, "loss": 1.2773, "step": 9346 }, { "epoch": 0.26, "learning_rate": 1.745480061032518e-05, "loss": 1.4146, "step": 9347 }, { "epoch": 0.26, "learning_rate": 1.745421103241697e-05, "loss": 1.4304, "step": 9348 }, { "epoch": 0.26, "learning_rate": 1.7453621396190522e-05, "loss": 1.3677, "step": 9349 }, { "epoch": 0.26, "learning_rate": 1.7453031701650444e-05, "loss": 1.48, "step": 9350 }, { "epoch": 0.26, "learning_rate": 1.7452441948801352e-05, "loss": 1.4463, "step": 9351 }, { "epoch": 0.26, "learning_rate": 1.7451852137647858e-05, "loss": 1.3013, "step": 9352 }, { "epoch": 0.26, "learning_rate": 1.7451262268194575e-05, "loss": 1.2654, "step": 9353 }, { "epoch": 0.26, "learning_rate": 1.745067234044612e-05, "loss": 1.4705, "step": 9354 }, { "epoch": 0.26, "learning_rate": 1.745008235440711e-05, "loss": 1.3101, "step": 9355 }, { "epoch": 0.26, "learning_rate": 1.7449492310082158e-05, "loss": 1.5032, "step": 9356 }, { "epoch": 0.26, "learning_rate": 1.7448902207475883e-05, "loss": 1.4016, "step": 9357 }, { "epoch": 0.26, "learning_rate": 1.7448312046592897e-05, "loss": 1.2571, "step": 9358 }, { "epoch": 0.26, "learning_rate": 1.744772182743782e-05, "loss": 1.3362, "step": 9359 }, { "epoch": 0.26, "learning_rate": 1.7447131550015273e-05, "loss": 1.3752, "step": 9360 }, { "epoch": 0.26, "learning_rate": 1.7446541214329865e-05, "loss": 1.2742, "step": 9361 }, { "epoch": 0.26, "learning_rate": 1.7445950820386224e-05, "loss": 1.3787, "step": 9362 }, { "epoch": 0.26, "learning_rate": 1.7445360368188967e-05, "loss": 1.4265, "step": 9363 }, { "epoch": 0.26, "learning_rate": 1.7444769857742708e-05, "loss": 1.3455, "step": 9364 }, { "epoch": 0.26, "learning_rate": 1.744417928905207e-05, "loss": 1.2942, "step": 9365 }, { "epoch": 0.26, "learning_rate": 1.7443588662121674e-05, "loss": 1.3247, "step": 9366 }, { "epoch": 0.26, "learning_rate": 1.7442997976956143e-05, "loss": 1.2935, "step": 9367 }, { "epoch": 0.26, "learning_rate": 1.7442407233560096e-05, "loss": 1.3669, "step": 9368 }, { "epoch": 0.26, "learning_rate": 1.7441816431938153e-05, "loss": 1.2776, "step": 9369 }, { "epoch": 0.26, "learning_rate": 1.7441225572094936e-05, "loss": 1.5508, "step": 9370 }, { "epoch": 0.26, "learning_rate": 1.744063465403507e-05, "loss": 1.3254, "step": 9371 }, { "epoch": 0.26, "learning_rate": 1.744004367776318e-05, "loss": 1.7129, "step": 9372 }, { "epoch": 0.26, "learning_rate": 1.7439452643283888e-05, "loss": 1.3591, "step": 9373 }, { "epoch": 0.26, "learning_rate": 1.743886155060181e-05, "loss": 1.395, "step": 9374 }, { "epoch": 0.26, "learning_rate": 1.7438270399721583e-05, "loss": 1.2576, "step": 9375 }, { "epoch": 0.26, "learning_rate": 1.7437679190647824e-05, "loss": 1.3801, "step": 9376 }, { "epoch": 0.26, "learning_rate": 1.7437087923385162e-05, "loss": 1.2969, "step": 9377 }, { "epoch": 0.26, "learning_rate": 1.743649659793822e-05, "loss": 1.2944, "step": 9378 }, { "epoch": 0.26, "learning_rate": 1.7435905214311625e-05, "loss": 1.3948, "step": 9379 }, { "epoch": 0.26, "learning_rate": 1.7435313772510004e-05, "loss": 1.3857, "step": 9380 }, { "epoch": 0.26, "learning_rate": 1.7434722272537985e-05, "loss": 1.4663, "step": 9381 }, { "epoch": 0.26, "learning_rate": 1.7434130714400193e-05, "loss": 1.209, "step": 9382 }, { "epoch": 0.26, "learning_rate": 1.743353909810126e-05, "loss": 1.3484, "step": 9383 }, { "epoch": 0.26, "learning_rate": 1.7432947423645815e-05, "loss": 1.1201, "step": 9384 }, { "epoch": 0.26, "learning_rate": 1.743235569103848e-05, "loss": 1.1499, "step": 9385 }, { "epoch": 0.26, "learning_rate": 1.7431763900283893e-05, "loss": 1.5254, "step": 9386 }, { "epoch": 0.26, "learning_rate": 1.7431172051386677e-05, "loss": 1.4419, "step": 9387 }, { "epoch": 0.26, "learning_rate": 1.7430580144351464e-05, "loss": 1.2292, "step": 9388 }, { "epoch": 0.26, "learning_rate": 1.7429988179182893e-05, "loss": 1.468, "step": 9389 }, { "epoch": 0.26, "learning_rate": 1.7429396155885584e-05, "loss": 1.085, "step": 9390 }, { "epoch": 0.26, "learning_rate": 1.7428804074464173e-05, "loss": 1.3208, "step": 9391 }, { "epoch": 0.26, "learning_rate": 1.7428211934923292e-05, "loss": 1.3726, "step": 9392 }, { "epoch": 0.26, "learning_rate": 1.742761973726757e-05, "loss": 1.384, "step": 9393 }, { "epoch": 0.26, "learning_rate": 1.742702748150165e-05, "loss": 1.2029, "step": 9394 }, { "epoch": 0.26, "learning_rate": 1.7426435167630157e-05, "loss": 1.3921, "step": 9395 }, { "epoch": 0.26, "learning_rate": 1.742584279565773e-05, "loss": 1.3838, "step": 9396 }, { "epoch": 0.26, "learning_rate": 1.7425250365588995e-05, "loss": 1.3867, "step": 9397 }, { "epoch": 0.26, "learning_rate": 1.7424657877428598e-05, "loss": 1.4851, "step": 9398 }, { "epoch": 0.26, "learning_rate": 1.7424065331181167e-05, "loss": 1.3652, "step": 9399 }, { "epoch": 0.26, "learning_rate": 1.742347272685134e-05, "loss": 1.2537, "step": 9400 }, { "epoch": 0.26, "learning_rate": 1.742288006444375e-05, "loss": 1.2969, "step": 9401 }, { "epoch": 0.26, "learning_rate": 1.7422287343963043e-05, "loss": 1.5198, "step": 9402 }, { "epoch": 0.26, "learning_rate": 1.742169456541385e-05, "loss": 1.231, "step": 9403 }, { "epoch": 0.26, "learning_rate": 1.7421101728800803e-05, "loss": 1.3796, "step": 9404 }, { "epoch": 0.26, "learning_rate": 1.7420508834128548e-05, "loss": 1.4106, "step": 9405 }, { "epoch": 0.26, "learning_rate": 1.7419915881401723e-05, "loss": 1.3103, "step": 9406 }, { "epoch": 0.26, "learning_rate": 1.7419322870624964e-05, "loss": 1.4741, "step": 9407 }, { "epoch": 0.26, "learning_rate": 1.741872980180291e-05, "loss": 1.2156, "step": 9408 }, { "epoch": 0.26, "learning_rate": 1.7418136674940203e-05, "loss": 1.1948, "step": 9409 }, { "epoch": 0.26, "learning_rate": 1.7417543490041487e-05, "loss": 1.3271, "step": 9410 }, { "epoch": 0.26, "learning_rate": 1.7416950247111396e-05, "loss": 1.366, "step": 9411 }, { "epoch": 0.26, "learning_rate": 1.7416356946154573e-05, "loss": 1.3894, "step": 9412 }, { "epoch": 0.26, "learning_rate": 1.741576358717566e-05, "loss": 1.2651, "step": 9413 }, { "epoch": 0.26, "learning_rate": 1.7415170170179304e-05, "loss": 1.3479, "step": 9414 }, { "epoch": 0.26, "learning_rate": 1.741457669517014e-05, "loss": 1.3745, "step": 9415 }, { "epoch": 0.26, "learning_rate": 1.7413983162152816e-05, "loss": 1.2507, "step": 9416 }, { "epoch": 0.26, "learning_rate": 1.741338957113197e-05, "loss": 1.4573, "step": 9417 }, { "epoch": 0.26, "learning_rate": 1.7412795922112254e-05, "loss": 1.356, "step": 9418 }, { "epoch": 0.26, "learning_rate": 1.741220221509831e-05, "loss": 1.2927, "step": 9419 }, { "epoch": 0.26, "learning_rate": 1.7411608450094778e-05, "loss": 1.3545, "step": 9420 }, { "epoch": 0.26, "learning_rate": 1.7411014627106306e-05, "loss": 1.4097, "step": 9421 }, { "epoch": 0.26, "learning_rate": 1.741042074613754e-05, "loss": 1.3621, "step": 9422 }, { "epoch": 0.26, "learning_rate": 1.7409826807193134e-05, "loss": 1.3965, "step": 9423 }, { "epoch": 0.26, "learning_rate": 1.7409232810277718e-05, "loss": 1.4021, "step": 9424 }, { "epoch": 0.26, "learning_rate": 1.7408638755395955e-05, "loss": 1.5161, "step": 9425 }, { "epoch": 0.26, "learning_rate": 1.7408044642552486e-05, "loss": 1.4055, "step": 9426 }, { "epoch": 0.26, "learning_rate": 1.7407450471751953e-05, "loss": 1.2844, "step": 9427 }, { "epoch": 0.26, "learning_rate": 1.7406856242999018e-05, "loss": 1.7759, "step": 9428 }, { "epoch": 0.26, "learning_rate": 1.7406261956298317e-05, "loss": 1.3733, "step": 9429 }, { "epoch": 0.26, "learning_rate": 1.740566761165451e-05, "loss": 1.5566, "step": 9430 }, { "epoch": 0.26, "learning_rate": 1.740507320907224e-05, "loss": 1.438, "step": 9431 }, { "epoch": 0.26, "learning_rate": 1.7404478748556157e-05, "loss": 1.3625, "step": 9432 }, { "epoch": 0.26, "learning_rate": 1.7403884230110917e-05, "loss": 1.2305, "step": 9433 }, { "epoch": 0.26, "learning_rate": 1.7403289653741167e-05, "loss": 1.4038, "step": 9434 }, { "epoch": 0.26, "learning_rate": 1.740269501945156e-05, "loss": 1.2495, "step": 9435 }, { "epoch": 0.26, "learning_rate": 1.7402100327246748e-05, "loss": 1.407, "step": 9436 }, { "epoch": 0.26, "learning_rate": 1.7401505577131387e-05, "loss": 1.2466, "step": 9437 }, { "epoch": 0.26, "learning_rate": 1.7400910769110123e-05, "loss": 1.4163, "step": 9438 }, { "epoch": 0.26, "learning_rate": 1.7400315903187618e-05, "loss": 1.3184, "step": 9439 }, { "epoch": 0.26, "learning_rate": 1.7399720979368517e-05, "loss": 1.2795, "step": 9440 }, { "epoch": 0.26, "learning_rate": 1.7399125997657478e-05, "loss": 1.4497, "step": 9441 }, { "epoch": 0.26, "learning_rate": 1.7398530958059158e-05, "loss": 1.3638, "step": 9442 }, { "epoch": 0.26, "learning_rate": 1.739793586057821e-05, "loss": 1.3206, "step": 9443 }, { "epoch": 0.26, "learning_rate": 1.7397340705219293e-05, "loss": 1.3213, "step": 9444 }, { "epoch": 0.26, "learning_rate": 1.7396745491987058e-05, "loss": 1.2454, "step": 9445 }, { "epoch": 0.26, "learning_rate": 1.7396150220886167e-05, "loss": 1.4873, "step": 9446 }, { "epoch": 0.26, "learning_rate": 1.7395554891921273e-05, "loss": 1.4102, "step": 9447 }, { "epoch": 0.26, "learning_rate": 1.7394959505097032e-05, "loss": 1.3169, "step": 9448 }, { "epoch": 0.26, "learning_rate": 1.739436406041811e-05, "loss": 1.3779, "step": 9449 }, { "epoch": 0.26, "learning_rate": 1.7393768557889162e-05, "loss": 1.2214, "step": 9450 }, { "epoch": 0.26, "learning_rate": 1.739317299751484e-05, "loss": 1.2896, "step": 9451 }, { "epoch": 0.26, "learning_rate": 1.7392577379299813e-05, "loss": 1.261, "step": 9452 }, { "epoch": 0.26, "learning_rate": 1.7391981703248735e-05, "loss": 1.2559, "step": 9453 }, { "epoch": 0.26, "learning_rate": 1.739138596936627e-05, "loss": 1.321, "step": 9454 }, { "epoch": 0.26, "learning_rate": 1.7390790177657075e-05, "loss": 1.3323, "step": 9455 }, { "epoch": 0.26, "learning_rate": 1.7390194328125814e-05, "loss": 1.3867, "step": 9456 }, { "epoch": 0.26, "learning_rate": 1.7389598420777147e-05, "loss": 1.1926, "step": 9457 }, { "epoch": 0.26, "learning_rate": 1.7389002455615737e-05, "loss": 1.2434, "step": 9458 }, { "epoch": 0.26, "learning_rate": 1.7388406432646246e-05, "loss": 1.2803, "step": 9459 }, { "epoch": 0.26, "learning_rate": 1.738781035187334e-05, "loss": 1.4128, "step": 9460 }, { "epoch": 0.26, "learning_rate": 1.7387214213301677e-05, "loss": 1.3177, "step": 9461 }, { "epoch": 0.26, "learning_rate": 1.7386618016935925e-05, "loss": 1.46, "step": 9462 }, { "epoch": 0.26, "learning_rate": 1.7386021762780745e-05, "loss": 1.4836, "step": 9463 }, { "epoch": 0.26, "learning_rate": 1.7385425450840804e-05, "loss": 1.3833, "step": 9464 }, { "epoch": 0.26, "learning_rate": 1.738482908112077e-05, "loss": 1.3633, "step": 9465 }, { "epoch": 0.26, "learning_rate": 1.7384232653625303e-05, "loss": 1.334, "step": 9466 }, { "epoch": 0.26, "learning_rate": 1.7383636168359077e-05, "loss": 1.407, "step": 9467 }, { "epoch": 0.26, "learning_rate": 1.738303962532675e-05, "loss": 1.3997, "step": 9468 }, { "epoch": 0.26, "learning_rate": 1.738244302453299e-05, "loss": 1.1772, "step": 9469 }, { "epoch": 0.26, "learning_rate": 1.738184636598247e-05, "loss": 1.4585, "step": 9470 }, { "epoch": 0.26, "learning_rate": 1.7381249649679854e-05, "loss": 1.3379, "step": 9471 }, { "epoch": 0.26, "learning_rate": 1.7380652875629813e-05, "loss": 1.4336, "step": 9472 }, { "epoch": 0.26, "learning_rate": 1.7380056043837014e-05, "loss": 1.3059, "step": 9473 }, { "epoch": 0.26, "learning_rate": 1.737945915430613e-05, "loss": 1.4524, "step": 9474 }, { "epoch": 0.26, "learning_rate": 1.7378862207041822e-05, "loss": 1.4658, "step": 9475 }, { "epoch": 0.26, "learning_rate": 1.737826520204877e-05, "loss": 1.3201, "step": 9476 }, { "epoch": 0.26, "learning_rate": 1.7377668139331638e-05, "loss": 1.4463, "step": 9477 }, { "epoch": 0.26, "learning_rate": 1.7377071018895103e-05, "loss": 1.4104, "step": 9478 }, { "epoch": 0.26, "learning_rate": 1.737647384074383e-05, "loss": 1.3225, "step": 9479 }, { "epoch": 0.26, "learning_rate": 1.7375876604882496e-05, "loss": 1.4487, "step": 9480 }, { "epoch": 0.26, "learning_rate": 1.737527931131577e-05, "loss": 1.2214, "step": 9481 }, { "epoch": 0.26, "learning_rate": 1.7374681960048328e-05, "loss": 1.3777, "step": 9482 }, { "epoch": 0.26, "learning_rate": 1.7374084551084843e-05, "loss": 1.394, "step": 9483 }, { "epoch": 0.26, "learning_rate": 1.7373487084429988e-05, "loss": 1.3713, "step": 9484 }, { "epoch": 0.26, "learning_rate": 1.7372889560088438e-05, "loss": 1.4473, "step": 9485 }, { "epoch": 0.26, "learning_rate": 1.7372291978064867e-05, "loss": 1.2402, "step": 9486 }, { "epoch": 0.26, "learning_rate": 1.737169433836395e-05, "loss": 1.3254, "step": 9487 }, { "epoch": 0.26, "learning_rate": 1.7371096640990356e-05, "loss": 1.2354, "step": 9488 }, { "epoch": 0.26, "learning_rate": 1.7370498885948775e-05, "loss": 1.314, "step": 9489 }, { "epoch": 0.26, "learning_rate": 1.7369901073243878e-05, "loss": 1.4609, "step": 9490 }, { "epoch": 0.26, "learning_rate": 1.7369303202880337e-05, "loss": 1.3369, "step": 9491 }, { "epoch": 0.26, "learning_rate": 1.7368705274862834e-05, "loss": 1.4094, "step": 9492 }, { "epoch": 0.26, "learning_rate": 1.7368107289196045e-05, "loss": 1.2864, "step": 9493 }, { "epoch": 0.26, "learning_rate": 1.736750924588465e-05, "loss": 1.5625, "step": 9494 }, { "epoch": 0.26, "learning_rate": 1.7366911144933326e-05, "loss": 1.4224, "step": 9495 }, { "epoch": 0.26, "learning_rate": 1.7366312986346756e-05, "loss": 1.4144, "step": 9496 }, { "epoch": 0.26, "learning_rate": 1.7365714770129617e-05, "loss": 1.4038, "step": 9497 }, { "epoch": 0.26, "learning_rate": 1.7365116496286586e-05, "loss": 1.4307, "step": 9498 }, { "epoch": 0.26, "learning_rate": 1.736451816482235e-05, "loss": 1.3821, "step": 9499 }, { "epoch": 0.26, "learning_rate": 1.7363919775741586e-05, "loss": 1.344, "step": 9500 }, { "epoch": 0.26, "learning_rate": 1.7363321329048977e-05, "loss": 1.2932, "step": 9501 }, { "epoch": 0.26, "learning_rate": 1.7362722824749204e-05, "loss": 1.2405, "step": 9502 }, { "epoch": 0.26, "learning_rate": 1.7362124262846948e-05, "loss": 1.478, "step": 9503 }, { "epoch": 0.26, "learning_rate": 1.73615256433469e-05, "loss": 1.4238, "step": 9504 }, { "epoch": 0.26, "learning_rate": 1.736092696625373e-05, "loss": 1.3394, "step": 9505 }, { "epoch": 0.26, "learning_rate": 1.736032823157213e-05, "loss": 1.2979, "step": 9506 }, { "epoch": 0.26, "learning_rate": 1.7359729439306786e-05, "loss": 1.1792, "step": 9507 }, { "epoch": 0.26, "learning_rate": 1.7359130589462378e-05, "loss": 1.4385, "step": 9508 }, { "epoch": 0.26, "learning_rate": 1.735853168204359e-05, "loss": 1.481, "step": 9509 }, { "epoch": 0.26, "learning_rate": 1.7357932717055114e-05, "loss": 1.7798, "step": 9510 }, { "epoch": 0.26, "learning_rate": 1.7357333694501627e-05, "loss": 1.0889, "step": 9511 }, { "epoch": 0.26, "learning_rate": 1.7356734614387826e-05, "loss": 1.3657, "step": 9512 }, { "epoch": 0.26, "learning_rate": 1.7356135476718393e-05, "loss": 1.3999, "step": 9513 }, { "epoch": 0.26, "learning_rate": 1.7355536281498015e-05, "loss": 1.3804, "step": 9514 }, { "epoch": 0.26, "learning_rate": 1.7354937028731378e-05, "loss": 1.3413, "step": 9515 }, { "epoch": 0.26, "learning_rate": 1.7354337718423173e-05, "loss": 1.2563, "step": 9516 }, { "epoch": 0.26, "learning_rate": 1.7353738350578087e-05, "loss": 1.3486, "step": 9517 }, { "epoch": 0.26, "learning_rate": 1.7353138925200812e-05, "loss": 1.5547, "step": 9518 }, { "epoch": 0.26, "learning_rate": 1.7352539442296035e-05, "loss": 1.4561, "step": 9519 }, { "epoch": 0.26, "learning_rate": 1.7351939901868446e-05, "loss": 1.2654, "step": 9520 }, { "epoch": 0.26, "learning_rate": 1.7351340303922737e-05, "loss": 1.1925, "step": 9521 }, { "epoch": 0.26, "learning_rate": 1.73507406484636e-05, "loss": 1.1611, "step": 9522 }, { "epoch": 0.26, "learning_rate": 1.7350140935495724e-05, "loss": 1.3347, "step": 9523 }, { "epoch": 0.26, "learning_rate": 1.7349541165023796e-05, "loss": 1.2212, "step": 9524 }, { "epoch": 0.26, "learning_rate": 1.734894133705252e-05, "loss": 1.4023, "step": 9525 }, { "epoch": 0.26, "learning_rate": 1.734834145158658e-05, "loss": 1.4106, "step": 9526 }, { "epoch": 0.26, "learning_rate": 1.7347741508630673e-05, "loss": 1.1315, "step": 9527 }, { "epoch": 0.26, "learning_rate": 1.7347141508189493e-05, "loss": 1.3577, "step": 9528 }, { "epoch": 0.26, "learning_rate": 1.7346541450267732e-05, "loss": 1.3486, "step": 9529 }, { "epoch": 0.26, "learning_rate": 1.7345941334870083e-05, "loss": 1.3354, "step": 9530 }, { "epoch": 0.26, "learning_rate": 1.7345341162001245e-05, "loss": 1.302, "step": 9531 }, { "epoch": 0.26, "learning_rate": 1.7344740931665914e-05, "loss": 1.5117, "step": 9532 }, { "epoch": 0.26, "learning_rate": 1.734414064386878e-05, "loss": 1.4426, "step": 9533 }, { "epoch": 0.26, "learning_rate": 1.7343540298614544e-05, "loss": 1.3247, "step": 9534 }, { "epoch": 0.26, "learning_rate": 1.7342939895907903e-05, "loss": 1.4062, "step": 9535 }, { "epoch": 0.26, "learning_rate": 1.7342339435753554e-05, "loss": 1.4214, "step": 9536 }, { "epoch": 0.26, "learning_rate": 1.734173891815619e-05, "loss": 1.5308, "step": 9537 }, { "epoch": 0.26, "learning_rate": 1.7341138343120517e-05, "loss": 1.4883, "step": 9538 }, { "epoch": 0.26, "learning_rate": 1.734053771065123e-05, "loss": 1.5103, "step": 9539 }, { "epoch": 0.26, "learning_rate": 1.7339937020753023e-05, "loss": 1.4619, "step": 9540 }, { "epoch": 0.26, "learning_rate": 1.73393362734306e-05, "loss": 1.3232, "step": 9541 }, { "epoch": 0.26, "learning_rate": 1.733873546868867e-05, "loss": 1.3503, "step": 9542 }, { "epoch": 0.26, "learning_rate": 1.7338134606531917e-05, "loss": 1.3186, "step": 9543 }, { "epoch": 0.26, "learning_rate": 1.733753368696505e-05, "loss": 1.2734, "step": 9544 }, { "epoch": 0.26, "learning_rate": 1.733693270999277e-05, "loss": 1.4104, "step": 9545 }, { "epoch": 0.26, "learning_rate": 1.733633167561978e-05, "loss": 1.219, "step": 9546 }, { "epoch": 0.26, "learning_rate": 1.733573058385078e-05, "loss": 1.2739, "step": 9547 }, { "epoch": 0.26, "learning_rate": 1.7335129434690477e-05, "loss": 1.4263, "step": 9548 }, { "epoch": 0.26, "learning_rate": 1.7334528228143565e-05, "loss": 1.491, "step": 9549 }, { "epoch": 0.26, "learning_rate": 1.7333926964214756e-05, "loss": 1.2742, "step": 9550 }, { "epoch": 0.26, "learning_rate": 1.7333325642908748e-05, "loss": 1.3013, "step": 9551 }, { "epoch": 0.26, "learning_rate": 1.7332724264230254e-05, "loss": 1.4341, "step": 9552 }, { "epoch": 0.26, "learning_rate": 1.7332122828183967e-05, "loss": 1.3293, "step": 9553 }, { "epoch": 0.26, "learning_rate": 1.7331521334774603e-05, "loss": 1.458, "step": 9554 }, { "epoch": 0.26, "learning_rate": 1.7330919784006864e-05, "loss": 1.4895, "step": 9555 }, { "epoch": 0.26, "learning_rate": 1.7330318175885455e-05, "loss": 1.3091, "step": 9556 }, { "epoch": 0.26, "learning_rate": 1.7329716510415083e-05, "loss": 1.3589, "step": 9557 }, { "epoch": 0.26, "learning_rate": 1.7329114787600455e-05, "loss": 1.2708, "step": 9558 }, { "epoch": 0.26, "learning_rate": 1.732851300744628e-05, "loss": 1.3518, "step": 9559 }, { "epoch": 0.26, "learning_rate": 1.7327911169957267e-05, "loss": 1.4385, "step": 9560 }, { "epoch": 0.26, "learning_rate": 1.732730927513812e-05, "loss": 1.353, "step": 9561 }, { "epoch": 0.26, "learning_rate": 1.7326707322993555e-05, "loss": 1.3467, "step": 9562 }, { "epoch": 0.26, "learning_rate": 1.7326105313528273e-05, "loss": 1.2725, "step": 9563 }, { "epoch": 0.26, "learning_rate": 1.732550324674699e-05, "loss": 1.3389, "step": 9564 }, { "epoch": 0.26, "learning_rate": 1.7324901122654413e-05, "loss": 1.2205, "step": 9565 }, { "epoch": 0.26, "learning_rate": 1.7324298941255257e-05, "loss": 1.3501, "step": 9566 }, { "epoch": 0.26, "learning_rate": 1.7323696702554226e-05, "loss": 1.4844, "step": 9567 }, { "epoch": 0.26, "learning_rate": 1.732309440655604e-05, "loss": 1.2979, "step": 9568 }, { "epoch": 0.26, "learning_rate": 1.7322492053265403e-05, "loss": 1.3491, "step": 9569 }, { "epoch": 0.26, "learning_rate": 1.7321889642687032e-05, "loss": 1.3853, "step": 9570 }, { "epoch": 0.26, "learning_rate": 1.732128717482564e-05, "loss": 1.3682, "step": 9571 }, { "epoch": 0.26, "learning_rate": 1.732068464968594e-05, "loss": 1.2324, "step": 9572 }, { "epoch": 0.26, "learning_rate": 1.732008206727265e-05, "loss": 1.3865, "step": 9573 }, { "epoch": 0.26, "learning_rate": 1.7319479427590473e-05, "loss": 1.4509, "step": 9574 }, { "epoch": 0.26, "learning_rate": 1.7318876730644138e-05, "loss": 1.4399, "step": 9575 }, { "epoch": 0.26, "learning_rate": 1.7318273976438347e-05, "loss": 1.4858, "step": 9576 }, { "epoch": 0.26, "learning_rate": 1.7317671164977823e-05, "loss": 1.4287, "step": 9577 }, { "epoch": 0.26, "learning_rate": 1.7317068296267283e-05, "loss": 1.3604, "step": 9578 }, { "epoch": 0.26, "learning_rate": 1.731646537031144e-05, "loss": 1.469, "step": 9579 }, { "epoch": 0.26, "learning_rate": 1.731586238711501e-05, "loss": 1.3774, "step": 9580 }, { "epoch": 0.26, "learning_rate": 1.7315259346682716e-05, "loss": 1.187, "step": 9581 }, { "epoch": 0.26, "learning_rate": 1.7314656249019272e-05, "loss": 1.244, "step": 9582 }, { "epoch": 0.26, "learning_rate": 1.7314053094129398e-05, "loss": 1.7524, "step": 9583 }, { "epoch": 0.26, "learning_rate": 1.731344988201781e-05, "loss": 1.3142, "step": 9584 }, { "epoch": 0.26, "learning_rate": 1.7312846612689228e-05, "loss": 1.4856, "step": 9585 }, { "epoch": 0.26, "learning_rate": 1.7312243286148378e-05, "loss": 1.2288, "step": 9586 }, { "epoch": 0.26, "learning_rate": 1.731163990239997e-05, "loss": 1.5679, "step": 9587 }, { "epoch": 0.26, "learning_rate": 1.7311036461448733e-05, "loss": 1.3435, "step": 9588 }, { "epoch": 0.26, "learning_rate": 1.731043296329938e-05, "loss": 1.3267, "step": 9589 }, { "epoch": 0.26, "learning_rate": 1.7309829407956642e-05, "loss": 1.2886, "step": 9590 }, { "epoch": 0.26, "learning_rate": 1.7309225795425234e-05, "loss": 1.3916, "step": 9591 }, { "epoch": 0.26, "learning_rate": 1.7308622125709883e-05, "loss": 1.241, "step": 9592 }, { "epoch": 0.26, "learning_rate": 1.7308018398815306e-05, "loss": 1.407, "step": 9593 }, { "epoch": 0.26, "learning_rate": 1.730741461474623e-05, "loss": 1.4624, "step": 9594 }, { "epoch": 0.26, "learning_rate": 1.7306810773507376e-05, "loss": 1.4121, "step": 9595 }, { "epoch": 0.26, "learning_rate": 1.7306206875103474e-05, "loss": 1.3406, "step": 9596 }, { "epoch": 0.26, "learning_rate": 1.7305602919539243e-05, "loss": 1.3928, "step": 9597 }, { "epoch": 0.26, "learning_rate": 1.730499890681941e-05, "loss": 1.4116, "step": 9598 }, { "epoch": 0.26, "learning_rate": 1.7304394836948705e-05, "loss": 1.3958, "step": 9599 }, { "epoch": 0.26, "learning_rate": 1.7303790709931847e-05, "loss": 1.3535, "step": 9600 }, { "epoch": 0.26, "learning_rate": 1.7303186525773563e-05, "loss": 1.3616, "step": 9601 }, { "epoch": 0.26, "learning_rate": 1.7302582284478584e-05, "loss": 1.3779, "step": 9602 }, { "epoch": 0.26, "learning_rate": 1.7301977986051635e-05, "loss": 1.3237, "step": 9603 }, { "epoch": 0.26, "learning_rate": 1.730137363049744e-05, "loss": 1.4685, "step": 9604 }, { "epoch": 0.26, "learning_rate": 1.7300769217820737e-05, "loss": 1.3438, "step": 9605 }, { "epoch": 0.26, "learning_rate": 1.7300164748026243e-05, "loss": 1.334, "step": 9606 }, { "epoch": 0.26, "learning_rate": 1.72995602211187e-05, "loss": 1.2969, "step": 9607 }, { "epoch": 0.26, "learning_rate": 1.7298955637102826e-05, "loss": 1.3174, "step": 9608 }, { "epoch": 0.26, "learning_rate": 1.7298350995983356e-05, "loss": 1.4175, "step": 9609 }, { "epoch": 0.26, "learning_rate": 1.7297746297765018e-05, "loss": 1.3076, "step": 9610 }, { "epoch": 0.26, "learning_rate": 1.7297141542452544e-05, "loss": 1.3215, "step": 9611 }, { "epoch": 0.26, "learning_rate": 1.7296536730050668e-05, "loss": 1.3108, "step": 9612 }, { "epoch": 0.26, "learning_rate": 1.729593186056412e-05, "loss": 1.3196, "step": 9613 }, { "epoch": 0.26, "learning_rate": 1.7295326933997628e-05, "loss": 1.5352, "step": 9614 }, { "epoch": 0.26, "learning_rate": 1.7294721950355933e-05, "loss": 1.8608, "step": 9615 }, { "epoch": 0.26, "learning_rate": 1.7294116909643764e-05, "loss": 1.2704, "step": 9616 }, { "epoch": 0.26, "learning_rate": 1.7293511811865853e-05, "loss": 1.2451, "step": 9617 }, { "epoch": 0.26, "learning_rate": 1.7292906657026935e-05, "loss": 1.3591, "step": 9618 }, { "epoch": 0.26, "learning_rate": 1.729230144513174e-05, "loss": 1.314, "step": 9619 }, { "epoch": 0.26, "learning_rate": 1.7291696176185016e-05, "loss": 1.5225, "step": 9620 }, { "epoch": 0.26, "learning_rate": 1.7291090850191486e-05, "loss": 1.2471, "step": 9621 }, { "epoch": 0.26, "learning_rate": 1.729048546715589e-05, "loss": 1.3711, "step": 9622 }, { "epoch": 0.26, "learning_rate": 1.7289880027082964e-05, "loss": 1.5479, "step": 9623 }, { "epoch": 0.26, "learning_rate": 1.7289274529977446e-05, "loss": 1.2883, "step": 9624 }, { "epoch": 0.26, "learning_rate": 1.7288668975844068e-05, "loss": 1.4236, "step": 9625 }, { "epoch": 0.26, "learning_rate": 1.7288063364687572e-05, "loss": 1.4163, "step": 9626 }, { "epoch": 0.26, "learning_rate": 1.7287457696512698e-05, "loss": 1.2952, "step": 9627 }, { "epoch": 0.26, "learning_rate": 1.728685197132418e-05, "loss": 1.4644, "step": 9628 }, { "epoch": 0.26, "learning_rate": 1.728624618912676e-05, "loss": 1.2847, "step": 9629 }, { "epoch": 0.26, "learning_rate": 1.7285640349925176e-05, "loss": 1.187, "step": 9630 }, { "epoch": 0.26, "learning_rate": 1.7285034453724167e-05, "loss": 1.5112, "step": 9631 }, { "epoch": 0.26, "learning_rate": 1.7284428500528475e-05, "loss": 1.2002, "step": 9632 }, { "epoch": 0.26, "learning_rate": 1.728382249034284e-05, "loss": 1.2263, "step": 9633 }, { "epoch": 0.26, "learning_rate": 1.7283216423171997e-05, "loss": 1.3247, "step": 9634 }, { "epoch": 0.26, "learning_rate": 1.7282610299020703e-05, "loss": 1.1016, "step": 9635 }, { "epoch": 0.26, "learning_rate": 1.7282004117893684e-05, "loss": 1.2947, "step": 9636 }, { "epoch": 0.26, "learning_rate": 1.728139787979569e-05, "loss": 1.4004, "step": 9637 }, { "epoch": 0.26, "learning_rate": 1.7280791584731466e-05, "loss": 1.4062, "step": 9638 }, { "epoch": 0.26, "learning_rate": 1.7280185232705748e-05, "loss": 1.3191, "step": 9639 }, { "epoch": 0.26, "learning_rate": 1.7279578823723288e-05, "loss": 1.3599, "step": 9640 }, { "epoch": 0.26, "learning_rate": 1.7278972357788823e-05, "loss": 1.449, "step": 9641 }, { "epoch": 0.26, "learning_rate": 1.7278365834907106e-05, "loss": 1.2695, "step": 9642 }, { "epoch": 0.26, "learning_rate": 1.727775925508287e-05, "loss": 1.2319, "step": 9643 }, { "epoch": 0.26, "learning_rate": 1.7277152618320875e-05, "loss": 1.4297, "step": 9644 }, { "epoch": 0.26, "learning_rate": 1.7276545924625857e-05, "loss": 1.4087, "step": 9645 }, { "epoch": 0.26, "learning_rate": 1.7275939174002565e-05, "loss": 1.3962, "step": 9646 }, { "epoch": 0.26, "learning_rate": 1.7275332366455745e-05, "loss": 1.2703, "step": 9647 }, { "epoch": 0.26, "learning_rate": 1.7274725501990147e-05, "loss": 1.3042, "step": 9648 }, { "epoch": 0.26, "learning_rate": 1.7274118580610518e-05, "loss": 1.3337, "step": 9649 }, { "epoch": 0.26, "learning_rate": 1.7273511602321605e-05, "loss": 1.4016, "step": 9650 }, { "epoch": 0.26, "learning_rate": 1.7272904567128158e-05, "loss": 1.396, "step": 9651 }, { "epoch": 0.26, "learning_rate": 1.7272297475034924e-05, "loss": 1.4578, "step": 9652 }, { "epoch": 0.26, "learning_rate": 1.7271690326046656e-05, "loss": 1.4443, "step": 9653 }, { "epoch": 0.26, "learning_rate": 1.72710831201681e-05, "loss": 1.3142, "step": 9654 }, { "epoch": 0.26, "learning_rate": 1.7270475857404014e-05, "loss": 1.446, "step": 9655 }, { "epoch": 0.26, "learning_rate": 1.726986853775914e-05, "loss": 1.4009, "step": 9656 }, { "epoch": 0.26, "learning_rate": 1.7269261161238235e-05, "loss": 1.3242, "step": 9657 }, { "epoch": 0.26, "learning_rate": 1.7268653727846044e-05, "loss": 1.4253, "step": 9658 }, { "epoch": 0.26, "learning_rate": 1.7268046237587328e-05, "loss": 1.3821, "step": 9659 }, { "epoch": 0.26, "learning_rate": 1.7267438690466836e-05, "loss": 1.3137, "step": 9660 }, { "epoch": 0.26, "learning_rate": 1.726683108648932e-05, "loss": 1.3687, "step": 9661 }, { "epoch": 0.26, "learning_rate": 1.7266223425659535e-05, "loss": 1.4766, "step": 9662 }, { "epoch": 0.26, "learning_rate": 1.7265615707982237e-05, "loss": 1.3833, "step": 9663 }, { "epoch": 0.26, "learning_rate": 1.7265007933462174e-05, "loss": 1.2517, "step": 9664 }, { "epoch": 0.26, "learning_rate": 1.726440010210411e-05, "loss": 1.4121, "step": 9665 }, { "epoch": 0.26, "learning_rate": 1.7263792213912794e-05, "loss": 1.4204, "step": 9666 }, { "epoch": 0.26, "learning_rate": 1.726318426889298e-05, "loss": 1.4219, "step": 9667 }, { "epoch": 0.26, "learning_rate": 1.726257626704943e-05, "loss": 1.3381, "step": 9668 }, { "epoch": 0.26, "learning_rate": 1.7261968208386897e-05, "loss": 1.4788, "step": 9669 }, { "epoch": 0.26, "learning_rate": 1.7261360092910144e-05, "loss": 1.5142, "step": 9670 }, { "epoch": 0.26, "learning_rate": 1.726075192062392e-05, "loss": 1.3909, "step": 9671 }, { "epoch": 0.26, "learning_rate": 1.7260143691532987e-05, "loss": 1.2181, "step": 9672 }, { "epoch": 0.26, "learning_rate": 1.725953540564211e-05, "loss": 1.3811, "step": 9673 }, { "epoch": 0.26, "learning_rate": 1.7258927062956034e-05, "loss": 1.2871, "step": 9674 }, { "epoch": 0.26, "learning_rate": 1.7258318663479528e-05, "loss": 1.2947, "step": 9675 }, { "epoch": 0.26, "learning_rate": 1.725771020721735e-05, "loss": 1.3013, "step": 9676 }, { "epoch": 0.26, "learning_rate": 1.7257101694174262e-05, "loss": 1.2815, "step": 9677 }, { "epoch": 0.26, "learning_rate": 1.7256493124355022e-05, "loss": 1.3723, "step": 9678 }, { "epoch": 0.26, "learning_rate": 1.725588449776439e-05, "loss": 1.3967, "step": 9679 }, { "epoch": 0.26, "learning_rate": 1.7255275814407134e-05, "loss": 1.7485, "step": 9680 }, { "epoch": 0.26, "learning_rate": 1.7254667074288007e-05, "loss": 1.4302, "step": 9681 }, { "epoch": 0.26, "learning_rate": 1.7254058277411777e-05, "loss": 1.4434, "step": 9682 }, { "epoch": 0.26, "learning_rate": 1.725344942378321e-05, "loss": 1.259, "step": 9683 }, { "epoch": 0.26, "learning_rate": 1.7252840513407064e-05, "loss": 1.3687, "step": 9684 }, { "epoch": 0.26, "learning_rate": 1.72522315462881e-05, "loss": 1.8408, "step": 9685 }, { "epoch": 0.26, "learning_rate": 1.7251622522431093e-05, "loss": 1.1978, "step": 9686 }, { "epoch": 0.26, "learning_rate": 1.7251013441840795e-05, "loss": 1.2046, "step": 9687 }, { "epoch": 0.26, "learning_rate": 1.7250404304521983e-05, "loss": 1.4141, "step": 9688 }, { "epoch": 0.26, "learning_rate": 1.7249795110479414e-05, "loss": 1.3569, "step": 9689 }, { "epoch": 0.26, "learning_rate": 1.724918585971786e-05, "loss": 1.4636, "step": 9690 }, { "epoch": 0.26, "learning_rate": 1.724857655224208e-05, "loss": 1.4253, "step": 9691 }, { "epoch": 0.26, "learning_rate": 1.724796718805685e-05, "loss": 1.4568, "step": 9692 }, { "epoch": 0.26, "learning_rate": 1.724735776716693e-05, "loss": 1.3906, "step": 9693 }, { "epoch": 0.26, "learning_rate": 1.7246748289577092e-05, "loss": 1.4678, "step": 9694 }, { "epoch": 0.26, "learning_rate": 1.7246138755292104e-05, "loss": 1.3977, "step": 9695 }, { "epoch": 0.26, "learning_rate": 1.7245529164316733e-05, "loss": 1.3635, "step": 9696 }, { "epoch": 0.26, "learning_rate": 1.724491951665575e-05, "loss": 1.3831, "step": 9697 }, { "epoch": 0.26, "learning_rate": 1.724430981231392e-05, "loss": 1.3076, "step": 9698 }, { "epoch": 0.26, "learning_rate": 1.7243700051296016e-05, "loss": 1.2896, "step": 9699 }, { "epoch": 0.26, "learning_rate": 1.7243090233606815e-05, "loss": 1.4221, "step": 9700 }, { "epoch": 0.26, "learning_rate": 1.7242480359251076e-05, "loss": 1.4412, "step": 9701 }, { "epoch": 0.26, "learning_rate": 1.724187042823358e-05, "loss": 1.4019, "step": 9702 }, { "epoch": 0.26, "learning_rate": 1.7241260440559096e-05, "loss": 1.4302, "step": 9703 }, { "epoch": 0.27, "learning_rate": 1.7240650396232393e-05, "loss": 1.4102, "step": 9704 }, { "epoch": 0.27, "learning_rate": 1.7240040295258244e-05, "loss": 1.4609, "step": 9705 }, { "epoch": 0.27, "learning_rate": 1.723943013764143e-05, "loss": 1.7363, "step": 9706 }, { "epoch": 0.27, "learning_rate": 1.7238819923386713e-05, "loss": 1.2961, "step": 9707 }, { "epoch": 0.27, "learning_rate": 1.7238209652498876e-05, "loss": 1.4126, "step": 9708 }, { "epoch": 0.27, "learning_rate": 1.7237599324982692e-05, "loss": 1.3345, "step": 9709 }, { "epoch": 0.27, "learning_rate": 1.7236988940842932e-05, "loss": 1.3086, "step": 9710 }, { "epoch": 0.27, "learning_rate": 1.7236378500084372e-05, "loss": 1.4805, "step": 9711 }, { "epoch": 0.27, "learning_rate": 1.7235768002711794e-05, "loss": 1.3257, "step": 9712 }, { "epoch": 0.27, "learning_rate": 1.7235157448729967e-05, "loss": 1.5044, "step": 9713 }, { "epoch": 0.27, "learning_rate": 1.723454683814367e-05, "loss": 1.4214, "step": 9714 }, { "epoch": 0.27, "learning_rate": 1.7233936170957676e-05, "loss": 1.2869, "step": 9715 }, { "epoch": 0.27, "learning_rate": 1.7233325447176775e-05, "loss": 1.2517, "step": 9716 }, { "epoch": 0.27, "learning_rate": 1.7232714666805736e-05, "loss": 1.4126, "step": 9717 }, { "epoch": 0.27, "learning_rate": 1.723210382984933e-05, "loss": 1.4688, "step": 9718 }, { "epoch": 0.27, "learning_rate": 1.7231492936312352e-05, "loss": 1.4941, "step": 9719 }, { "epoch": 0.27, "learning_rate": 1.7230881986199572e-05, "loss": 1.3457, "step": 9720 }, { "epoch": 0.27, "learning_rate": 1.7230270979515773e-05, "loss": 1.3049, "step": 9721 }, { "epoch": 0.27, "learning_rate": 1.7229659916265734e-05, "loss": 1.3682, "step": 9722 }, { "epoch": 0.27, "learning_rate": 1.7229048796454237e-05, "loss": 1.3894, "step": 9723 }, { "epoch": 0.27, "learning_rate": 1.7228437620086055e-05, "loss": 1.2737, "step": 9724 }, { "epoch": 0.27, "learning_rate": 1.722782638716598e-05, "loss": 1.2952, "step": 9725 }, { "epoch": 0.27, "learning_rate": 1.7227215097698787e-05, "loss": 1.2778, "step": 9726 }, { "epoch": 0.27, "learning_rate": 1.7226603751689266e-05, "loss": 1.7017, "step": 9727 }, { "epoch": 0.27, "learning_rate": 1.7225992349142196e-05, "loss": 1.2864, "step": 9728 }, { "epoch": 0.27, "learning_rate": 1.7225380890062355e-05, "loss": 1.3479, "step": 9729 }, { "epoch": 0.27, "learning_rate": 1.7224769374454536e-05, "loss": 1.7627, "step": 9730 }, { "epoch": 0.27, "learning_rate": 1.7224157802323515e-05, "loss": 1.4565, "step": 9731 }, { "epoch": 0.27, "learning_rate": 1.7223546173674085e-05, "loss": 1.2427, "step": 9732 }, { "epoch": 0.27, "learning_rate": 1.7222934488511023e-05, "loss": 1.4282, "step": 9733 }, { "epoch": 0.27, "learning_rate": 1.7222322746839117e-05, "loss": 1.3052, "step": 9734 }, { "epoch": 0.27, "learning_rate": 1.7221710948663157e-05, "loss": 1.2969, "step": 9735 }, { "epoch": 0.27, "learning_rate": 1.7221099093987925e-05, "loss": 1.363, "step": 9736 }, { "epoch": 0.27, "learning_rate": 1.7220487182818208e-05, "loss": 1.3611, "step": 9737 }, { "epoch": 0.27, "learning_rate": 1.7219875215158795e-05, "loss": 1.3262, "step": 9738 }, { "epoch": 0.27, "learning_rate": 1.7219263191014476e-05, "loss": 1.3032, "step": 9739 }, { "epoch": 0.27, "learning_rate": 1.7218651110390037e-05, "loss": 1.3298, "step": 9740 }, { "epoch": 0.27, "learning_rate": 1.7218038973290263e-05, "loss": 1.7349, "step": 9741 }, { "epoch": 0.27, "learning_rate": 1.7217426779719947e-05, "loss": 1.2932, "step": 9742 }, { "epoch": 0.27, "learning_rate": 1.7216814529683877e-05, "loss": 1.3284, "step": 9743 }, { "epoch": 0.27, "learning_rate": 1.7216202223186848e-05, "loss": 1.2454, "step": 9744 }, { "epoch": 0.27, "learning_rate": 1.721558986023364e-05, "loss": 1.2632, "step": 9745 }, { "epoch": 0.27, "learning_rate": 1.7214977440829052e-05, "loss": 1.2979, "step": 9746 }, { "epoch": 0.27, "learning_rate": 1.7214364964977878e-05, "loss": 1.4146, "step": 9747 }, { "epoch": 0.27, "learning_rate": 1.7213752432684897e-05, "loss": 1.3035, "step": 9748 }, { "epoch": 0.27, "learning_rate": 1.7213139843954914e-05, "loss": 1.3005, "step": 9749 }, { "epoch": 0.27, "learning_rate": 1.7212527198792716e-05, "loss": 1.2446, "step": 9750 }, { "epoch": 0.27, "learning_rate": 1.7211914497203097e-05, "loss": 1.3665, "step": 9751 }, { "epoch": 0.27, "learning_rate": 1.721130173919085e-05, "loss": 1.4897, "step": 9752 }, { "epoch": 0.27, "learning_rate": 1.7210688924760768e-05, "loss": 1.3394, "step": 9753 }, { "epoch": 0.27, "learning_rate": 1.721007605391765e-05, "loss": 1.4473, "step": 9754 }, { "epoch": 0.27, "learning_rate": 1.7209463126666283e-05, "loss": 1.4736, "step": 9755 }, { "epoch": 0.27, "learning_rate": 1.7208850143011468e-05, "loss": 1.4316, "step": 9756 }, { "epoch": 0.27, "learning_rate": 1.7208237102958e-05, "loss": 1.4399, "step": 9757 }, { "epoch": 0.27, "learning_rate": 1.720762400651067e-05, "loss": 1.4287, "step": 9758 }, { "epoch": 0.27, "learning_rate": 1.720701085367429e-05, "loss": 1.4685, "step": 9759 }, { "epoch": 0.27, "learning_rate": 1.7206397644453637e-05, "loss": 1.4038, "step": 9760 }, { "epoch": 0.27, "learning_rate": 1.720578437885352e-05, "loss": 1.541, "step": 9761 }, { "epoch": 0.27, "learning_rate": 1.7205171056878733e-05, "loss": 1.2267, "step": 9762 }, { "epoch": 0.27, "learning_rate": 1.720455767853408e-05, "loss": 1.313, "step": 9763 }, { "epoch": 0.27, "learning_rate": 1.7203944243824353e-05, "loss": 1.3098, "step": 9764 }, { "epoch": 0.27, "learning_rate": 1.7203330752754352e-05, "loss": 1.5093, "step": 9765 }, { "epoch": 0.27, "learning_rate": 1.720271720532888e-05, "loss": 1.4175, "step": 9766 }, { "epoch": 0.27, "learning_rate": 1.7202103601552734e-05, "loss": 1.4341, "step": 9767 }, { "epoch": 0.27, "learning_rate": 1.720148994143072e-05, "loss": 1.3757, "step": 9768 }, { "epoch": 0.27, "learning_rate": 1.7200876224967632e-05, "loss": 1.3127, "step": 9769 }, { "epoch": 0.27, "learning_rate": 1.7200262452168276e-05, "loss": 1.4619, "step": 9770 }, { "epoch": 0.27, "learning_rate": 1.719964862303745e-05, "loss": 1.3799, "step": 9771 }, { "epoch": 0.27, "learning_rate": 1.7199034737579962e-05, "loss": 1.1736, "step": 9772 }, { "epoch": 0.27, "learning_rate": 1.719842079580061e-05, "loss": 1.354, "step": 9773 }, { "epoch": 0.27, "learning_rate": 1.7197806797704198e-05, "loss": 1.3174, "step": 9774 }, { "epoch": 0.27, "learning_rate": 1.719719274329553e-05, "loss": 1.2266, "step": 9775 }, { "epoch": 0.27, "learning_rate": 1.719657863257941e-05, "loss": 1.3196, "step": 9776 }, { "epoch": 0.27, "learning_rate": 1.7195964465560646e-05, "loss": 1.3684, "step": 9777 }, { "epoch": 0.27, "learning_rate": 1.7195350242244035e-05, "loss": 1.4624, "step": 9778 }, { "epoch": 0.27, "learning_rate": 1.719473596263439e-05, "loss": 1.3728, "step": 9779 }, { "epoch": 0.27, "learning_rate": 1.7194121626736513e-05, "loss": 1.2209, "step": 9780 }, { "epoch": 0.27, "learning_rate": 1.719350723455521e-05, "loss": 1.2925, "step": 9781 }, { "epoch": 0.27, "learning_rate": 1.7192892786095294e-05, "loss": 1.4128, "step": 9782 }, { "epoch": 0.27, "learning_rate": 1.7192278281361564e-05, "loss": 1.2339, "step": 9783 }, { "epoch": 0.27, "learning_rate": 1.719166372035883e-05, "loss": 1.2346, "step": 9784 }, { "epoch": 0.27, "learning_rate": 1.71910491030919e-05, "loss": 1.3021, "step": 9785 }, { "epoch": 0.27, "learning_rate": 1.7190434429565587e-05, "loss": 1.2583, "step": 9786 }, { "epoch": 0.27, "learning_rate": 1.7189819699784697e-05, "loss": 1.4431, "step": 9787 }, { "epoch": 0.27, "learning_rate": 1.7189204913754033e-05, "loss": 1.2666, "step": 9788 }, { "epoch": 0.27, "learning_rate": 1.7188590071478413e-05, "loss": 1.2678, "step": 9789 }, { "epoch": 0.27, "learning_rate": 1.7187975172962644e-05, "loss": 1.5591, "step": 9790 }, { "epoch": 0.27, "learning_rate": 1.7187360218211538e-05, "loss": 1.4199, "step": 9791 }, { "epoch": 0.27, "learning_rate": 1.7186745207229906e-05, "loss": 1.394, "step": 9792 }, { "epoch": 0.27, "learning_rate": 1.718613014002256e-05, "loss": 1.2808, "step": 9793 }, { "epoch": 0.27, "learning_rate": 1.7185515016594308e-05, "loss": 1.4331, "step": 9794 }, { "epoch": 0.27, "learning_rate": 1.7184899836949968e-05, "loss": 1.4475, "step": 9795 }, { "epoch": 0.27, "learning_rate": 1.7184284601094346e-05, "loss": 1.4148, "step": 9796 }, { "epoch": 0.27, "learning_rate": 1.7183669309032264e-05, "loss": 1.3193, "step": 9797 }, { "epoch": 0.27, "learning_rate": 1.718305396076853e-05, "loss": 1.3103, "step": 9798 }, { "epoch": 0.27, "learning_rate": 1.7182438556307957e-05, "loss": 1.2839, "step": 9799 }, { "epoch": 0.27, "learning_rate": 1.7181823095655365e-05, "loss": 1.4382, "step": 9800 }, { "epoch": 0.27, "learning_rate": 1.7181207578815567e-05, "loss": 1.3477, "step": 9801 }, { "epoch": 0.27, "learning_rate": 1.7180592005793378e-05, "loss": 1.3572, "step": 9802 }, { "epoch": 0.27, "learning_rate": 1.717997637659361e-05, "loss": 1.3027, "step": 9803 }, { "epoch": 0.27, "learning_rate": 1.7179360691221085e-05, "loss": 1.3733, "step": 9804 }, { "epoch": 0.27, "learning_rate": 1.717874494968062e-05, "loss": 1.3896, "step": 9805 }, { "epoch": 0.27, "learning_rate": 1.7178129151977027e-05, "loss": 1.2944, "step": 9806 }, { "epoch": 0.27, "learning_rate": 1.7177513298115128e-05, "loss": 1.3215, "step": 9807 }, { "epoch": 0.27, "learning_rate": 1.7176897388099742e-05, "loss": 1.3984, "step": 9808 }, { "epoch": 0.27, "learning_rate": 1.7176281421935685e-05, "loss": 1.2942, "step": 9809 }, { "epoch": 0.27, "learning_rate": 1.7175665399627776e-05, "loss": 1.3875, "step": 9810 }, { "epoch": 0.27, "learning_rate": 1.717504932118083e-05, "loss": 1.4087, "step": 9811 }, { "epoch": 0.27, "learning_rate": 1.717443318659968e-05, "loss": 1.2859, "step": 9812 }, { "epoch": 0.27, "learning_rate": 1.7173816995889137e-05, "loss": 1.375, "step": 9813 }, { "epoch": 0.27, "learning_rate": 1.717320074905402e-05, "loss": 1.2419, "step": 9814 }, { "epoch": 0.27, "learning_rate": 1.7172584446099153e-05, "loss": 1.3914, "step": 9815 }, { "epoch": 0.27, "learning_rate": 1.7171968087029362e-05, "loss": 1.3052, "step": 9816 }, { "epoch": 0.27, "learning_rate": 1.7171351671849463e-05, "loss": 1.2583, "step": 9817 }, { "epoch": 0.27, "learning_rate": 1.717073520056428e-05, "loss": 1.3594, "step": 9818 }, { "epoch": 0.27, "learning_rate": 1.7170118673178638e-05, "loss": 1.3142, "step": 9819 }, { "epoch": 0.27, "learning_rate": 1.716950208969736e-05, "loss": 1.3628, "step": 9820 }, { "epoch": 0.27, "learning_rate": 1.7168885450125268e-05, "loss": 1.3787, "step": 9821 }, { "epoch": 0.27, "learning_rate": 1.7168268754467186e-05, "loss": 1.4902, "step": 9822 }, { "epoch": 0.27, "learning_rate": 1.716765200272794e-05, "loss": 1.3804, "step": 9823 }, { "epoch": 0.27, "learning_rate": 1.7167035194912357e-05, "loss": 1.3501, "step": 9824 }, { "epoch": 0.27, "learning_rate": 1.716641833102526e-05, "loss": 1.3611, "step": 9825 }, { "epoch": 0.27, "learning_rate": 1.7165801411071476e-05, "loss": 1.4404, "step": 9826 }, { "epoch": 0.27, "learning_rate": 1.7165184435055833e-05, "loss": 1.4878, "step": 9827 }, { "epoch": 0.27, "learning_rate": 1.7164567402983153e-05, "loss": 1.2668, "step": 9828 }, { "epoch": 0.27, "learning_rate": 1.7163950314858267e-05, "loss": 1.4158, "step": 9829 }, { "epoch": 0.27, "learning_rate": 1.7163333170686005e-05, "loss": 1.3884, "step": 9830 }, { "epoch": 0.27, "learning_rate": 1.716271597047119e-05, "loss": 1.4636, "step": 9831 }, { "epoch": 0.27, "learning_rate": 1.7162098714218656e-05, "loss": 1.3691, "step": 9832 }, { "epoch": 0.27, "learning_rate": 1.716148140193323e-05, "loss": 1.1721, "step": 9833 }, { "epoch": 0.27, "learning_rate": 1.716086403361974e-05, "loss": 1.5137, "step": 9834 }, { "epoch": 0.27, "learning_rate": 1.7160246609283014e-05, "loss": 1.2212, "step": 9835 }, { "epoch": 0.27, "learning_rate": 1.7159629128927888e-05, "loss": 1.3872, "step": 9836 }, { "epoch": 0.27, "learning_rate": 1.715901159255919e-05, "loss": 1.3027, "step": 9837 }, { "epoch": 0.27, "learning_rate": 1.715839400018175e-05, "loss": 1.3289, "step": 9838 }, { "epoch": 0.27, "learning_rate": 1.7157776351800404e-05, "loss": 1.5413, "step": 9839 }, { "epoch": 0.27, "learning_rate": 1.7157158647419985e-05, "loss": 1.3533, "step": 9840 }, { "epoch": 0.27, "learning_rate": 1.7156540887045317e-05, "loss": 1.7681, "step": 9841 }, { "epoch": 0.27, "learning_rate": 1.715592307068124e-05, "loss": 1.4084, "step": 9842 }, { "epoch": 0.27, "learning_rate": 1.7155305198332587e-05, "loss": 1.1704, "step": 9843 }, { "epoch": 0.27, "learning_rate": 1.7154687270004188e-05, "loss": 1.4434, "step": 9844 }, { "epoch": 0.27, "learning_rate": 1.715406928570088e-05, "loss": 1.2646, "step": 9845 }, { "epoch": 0.27, "learning_rate": 1.7153451245427502e-05, "loss": 1.323, "step": 9846 }, { "epoch": 0.27, "learning_rate": 1.7152833149188882e-05, "loss": 1.2881, "step": 9847 }, { "epoch": 0.27, "learning_rate": 1.715221499698986e-05, "loss": 1.3511, "step": 9848 }, { "epoch": 0.27, "learning_rate": 1.715159678883527e-05, "loss": 1.771, "step": 9849 }, { "epoch": 0.27, "learning_rate": 1.715097852472995e-05, "loss": 1.395, "step": 9850 }, { "epoch": 0.27, "learning_rate": 1.7150360204678737e-05, "loss": 1.3599, "step": 9851 }, { "epoch": 0.27, "learning_rate": 1.714974182868647e-05, "loss": 1.1917, "step": 9852 }, { "epoch": 0.27, "learning_rate": 1.7149123396757982e-05, "loss": 1.4258, "step": 9853 }, { "epoch": 0.27, "learning_rate": 1.7148504908898114e-05, "loss": 1.3468, "step": 9854 }, { "epoch": 0.27, "learning_rate": 1.714788636511171e-05, "loss": 1.2742, "step": 9855 }, { "epoch": 0.27, "learning_rate": 1.71472677654036e-05, "loss": 1.3113, "step": 9856 }, { "epoch": 0.27, "learning_rate": 1.7146649109778624e-05, "loss": 1.3228, "step": 9857 }, { "epoch": 0.27, "learning_rate": 1.7146030398241634e-05, "loss": 1.4761, "step": 9858 }, { "epoch": 0.27, "learning_rate": 1.714541163079746e-05, "loss": 1.3105, "step": 9859 }, { "epoch": 0.27, "learning_rate": 1.7144792807450942e-05, "loss": 1.3721, "step": 9860 }, { "epoch": 0.27, "learning_rate": 1.7144173928206927e-05, "loss": 1.4875, "step": 9861 }, { "epoch": 0.27, "learning_rate": 1.7143554993070254e-05, "loss": 1.0955, "step": 9862 }, { "epoch": 0.27, "learning_rate": 1.7142936002045767e-05, "loss": 1.5444, "step": 9863 }, { "epoch": 0.27, "learning_rate": 1.714231695513831e-05, "loss": 1.364, "step": 9864 }, { "epoch": 0.27, "learning_rate": 1.714169785235272e-05, "loss": 1.3677, "step": 9865 }, { "epoch": 0.27, "learning_rate": 1.7141078693693845e-05, "loss": 1.2788, "step": 9866 }, { "epoch": 0.27, "learning_rate": 1.714045947916653e-05, "loss": 1.3501, "step": 9867 }, { "epoch": 0.27, "learning_rate": 1.7139840208775614e-05, "loss": 1.3928, "step": 9868 }, { "epoch": 0.27, "learning_rate": 1.713922088252595e-05, "loss": 1.282, "step": 9869 }, { "epoch": 0.27, "learning_rate": 1.7138601500422378e-05, "loss": 1.3716, "step": 9870 }, { "epoch": 0.27, "learning_rate": 1.713798206246974e-05, "loss": 1.262, "step": 9871 }, { "epoch": 0.27, "learning_rate": 1.713736256867289e-05, "loss": 1.2651, "step": 9872 }, { "epoch": 0.27, "learning_rate": 1.713674301903667e-05, "loss": 1.3079, "step": 9873 }, { "epoch": 0.27, "learning_rate": 1.7136123413565933e-05, "loss": 1.3252, "step": 9874 }, { "epoch": 0.27, "learning_rate": 1.7135503752265523e-05, "loss": 1.4121, "step": 9875 }, { "epoch": 0.27, "learning_rate": 1.713488403514028e-05, "loss": 1.3914, "step": 9876 }, { "epoch": 0.27, "learning_rate": 1.7134264262195066e-05, "loss": 1.449, "step": 9877 }, { "epoch": 0.27, "learning_rate": 1.7133644433434716e-05, "loss": 1.228, "step": 9878 }, { "epoch": 0.27, "learning_rate": 1.713302454886409e-05, "loss": 1.481, "step": 9879 }, { "epoch": 0.27, "learning_rate": 1.7132404608488035e-05, "loss": 1.4937, "step": 9880 }, { "epoch": 0.27, "learning_rate": 1.71317846123114e-05, "loss": 1.4114, "step": 9881 }, { "epoch": 0.27, "learning_rate": 1.7131164560339038e-05, "loss": 1.2405, "step": 9882 }, { "epoch": 0.27, "learning_rate": 1.7130544452575794e-05, "loss": 1.4773, "step": 9883 }, { "epoch": 0.27, "learning_rate": 1.7129924289026526e-05, "loss": 1.364, "step": 9884 }, { "epoch": 0.27, "learning_rate": 1.712930406969608e-05, "loss": 1.4067, "step": 9885 }, { "epoch": 0.27, "learning_rate": 1.7128683794589313e-05, "loss": 1.4673, "step": 9886 }, { "epoch": 0.27, "learning_rate": 1.7128063463711075e-05, "loss": 1.4641, "step": 9887 }, { "epoch": 0.27, "learning_rate": 1.7127443077066224e-05, "loss": 1.2234, "step": 9888 }, { "epoch": 0.27, "learning_rate": 1.712682263465961e-05, "loss": 1.3633, "step": 9889 }, { "epoch": 0.27, "learning_rate": 1.712620213649608e-05, "loss": 1.4219, "step": 9890 }, { "epoch": 0.27, "learning_rate": 1.7125581582580498e-05, "loss": 1.3669, "step": 9891 }, { "epoch": 0.27, "learning_rate": 1.712496097291772e-05, "loss": 1.3677, "step": 9892 }, { "epoch": 0.27, "learning_rate": 1.71243403075126e-05, "loss": 1.4797, "step": 9893 }, { "epoch": 0.27, "learning_rate": 1.7123719586369985e-05, "loss": 1.1804, "step": 9894 }, { "epoch": 0.27, "learning_rate": 1.7123098809494737e-05, "loss": 1.2603, "step": 9895 }, { "epoch": 0.27, "learning_rate": 1.712247797689172e-05, "loss": 1.4011, "step": 9896 }, { "epoch": 0.27, "learning_rate": 1.712185708856578e-05, "loss": 1.3796, "step": 9897 }, { "epoch": 0.27, "learning_rate": 1.712123614452178e-05, "loss": 1.2847, "step": 9898 }, { "epoch": 0.27, "learning_rate": 1.712061514476458e-05, "loss": 1.2964, "step": 9899 }, { "epoch": 0.27, "learning_rate": 1.711999408929903e-05, "loss": 1.3298, "step": 9900 }, { "epoch": 0.27, "learning_rate": 1.711937297813e-05, "loss": 1.2383, "step": 9901 }, { "epoch": 0.27, "learning_rate": 1.7118751811262338e-05, "loss": 1.354, "step": 9902 }, { "epoch": 0.27, "learning_rate": 1.7118130588700916e-05, "loss": 1.3552, "step": 9903 }, { "epoch": 0.27, "learning_rate": 1.711750931045058e-05, "loss": 1.2949, "step": 9904 }, { "epoch": 0.27, "learning_rate": 1.71168879765162e-05, "loss": 1.3159, "step": 9905 }, { "epoch": 0.27, "learning_rate": 1.7116266586902635e-05, "loss": 1.2654, "step": 9906 }, { "epoch": 0.27, "learning_rate": 1.711564514161475e-05, "loss": 1.3823, "step": 9907 }, { "epoch": 0.27, "learning_rate": 1.7115023640657402e-05, "loss": 1.2498, "step": 9908 }, { "epoch": 0.27, "learning_rate": 1.7114402084035452e-05, "loss": 1.3694, "step": 9909 }, { "epoch": 0.27, "learning_rate": 1.711378047175377e-05, "loss": 1.3813, "step": 9910 }, { "epoch": 0.27, "learning_rate": 1.7113158803817214e-05, "loss": 1.0388, "step": 9911 }, { "epoch": 0.27, "learning_rate": 1.7112537080230646e-05, "loss": 1.2864, "step": 9912 }, { "epoch": 0.27, "learning_rate": 1.7111915300998934e-05, "loss": 1.3552, "step": 9913 }, { "epoch": 0.27, "learning_rate": 1.7111293466126938e-05, "loss": 1.4226, "step": 9914 }, { "epoch": 0.27, "learning_rate": 1.7110671575619528e-05, "loss": 1.2112, "step": 9915 }, { "epoch": 0.27, "learning_rate": 1.711004962948157e-05, "loss": 1.4116, "step": 9916 }, { "epoch": 0.27, "learning_rate": 1.7109427627717923e-05, "loss": 1.2227, "step": 9917 }, { "epoch": 0.27, "learning_rate": 1.710880557033346e-05, "loss": 1.4897, "step": 9918 }, { "epoch": 0.27, "learning_rate": 1.7108183457333044e-05, "loss": 1.4307, "step": 9919 }, { "epoch": 0.27, "learning_rate": 1.7107561288721543e-05, "loss": 1.3135, "step": 9920 }, { "epoch": 0.27, "learning_rate": 1.7106939064503823e-05, "loss": 1.3167, "step": 9921 }, { "epoch": 0.27, "learning_rate": 1.7106316784684756e-05, "loss": 1.3567, "step": 9922 }, { "epoch": 0.27, "learning_rate": 1.7105694449269207e-05, "loss": 1.3608, "step": 9923 }, { "epoch": 0.27, "learning_rate": 1.7105072058262043e-05, "loss": 1.3345, "step": 9924 }, { "epoch": 0.27, "learning_rate": 1.7104449611668142e-05, "loss": 1.1272, "step": 9925 }, { "epoch": 0.27, "learning_rate": 1.7103827109492365e-05, "loss": 1.2336, "step": 9926 }, { "epoch": 0.27, "learning_rate": 1.7103204551739586e-05, "loss": 1.448, "step": 9927 }, { "epoch": 0.27, "learning_rate": 1.7102581938414676e-05, "loss": 1.384, "step": 9928 }, { "epoch": 0.27, "learning_rate": 1.7101959269522504e-05, "loss": 1.2861, "step": 9929 }, { "epoch": 0.27, "learning_rate": 1.710133654506794e-05, "loss": 1.4575, "step": 9930 }, { "epoch": 0.27, "learning_rate": 1.710071376505586e-05, "loss": 1.3711, "step": 9931 }, { "epoch": 0.27, "learning_rate": 1.7100090929491132e-05, "loss": 1.3943, "step": 9932 }, { "epoch": 0.27, "learning_rate": 1.7099468038378636e-05, "loss": 1.3365, "step": 9933 }, { "epoch": 0.27, "learning_rate": 1.709884509172324e-05, "loss": 1.4185, "step": 9934 }, { "epoch": 0.27, "learning_rate": 1.7098222089529816e-05, "loss": 1.4443, "step": 9935 }, { "epoch": 0.27, "learning_rate": 1.709759903180324e-05, "loss": 1.4258, "step": 9936 }, { "epoch": 0.27, "learning_rate": 1.7096975918548384e-05, "loss": 1.4009, "step": 9937 }, { "epoch": 0.27, "learning_rate": 1.709635274977013e-05, "loss": 1.3657, "step": 9938 }, { "epoch": 0.27, "learning_rate": 1.7095729525473347e-05, "loss": 1.2869, "step": 9939 }, { "epoch": 0.27, "learning_rate": 1.7095106245662914e-05, "loss": 1.2551, "step": 9940 }, { "epoch": 0.27, "learning_rate": 1.7094482910343704e-05, "loss": 1.2866, "step": 9941 }, { "epoch": 0.27, "learning_rate": 1.7093859519520598e-05, "loss": 1.3965, "step": 9942 }, { "epoch": 0.27, "learning_rate": 1.709323607319847e-05, "loss": 1.3101, "step": 9943 }, { "epoch": 0.27, "learning_rate": 1.7092612571382198e-05, "loss": 1.4766, "step": 9944 }, { "epoch": 0.27, "learning_rate": 1.7091989014076663e-05, "loss": 1.3218, "step": 9945 }, { "epoch": 0.27, "learning_rate": 1.709136540128674e-05, "loss": 1.4604, "step": 9946 }, { "epoch": 0.27, "learning_rate": 1.7090741733017306e-05, "loss": 1.1863, "step": 9947 }, { "epoch": 0.27, "learning_rate": 1.7090118009273246e-05, "loss": 1.1465, "step": 9948 }, { "epoch": 0.27, "learning_rate": 1.7089494230059434e-05, "loss": 1.3474, "step": 9949 }, { "epoch": 0.27, "learning_rate": 1.7088870395380756e-05, "loss": 1.3477, "step": 9950 }, { "epoch": 0.27, "learning_rate": 1.7088246505242084e-05, "loss": 1.3701, "step": 9951 }, { "epoch": 0.27, "learning_rate": 1.7087622559648308e-05, "loss": 1.333, "step": 9952 }, { "epoch": 0.27, "learning_rate": 1.7086998558604306e-05, "loss": 1.2576, "step": 9953 }, { "epoch": 0.27, "learning_rate": 1.7086374502114963e-05, "loss": 1.3455, "step": 9954 }, { "epoch": 0.27, "learning_rate": 1.7085750390185153e-05, "loss": 1.3694, "step": 9955 }, { "epoch": 0.27, "learning_rate": 1.7085126222819767e-05, "loss": 1.2791, "step": 9956 }, { "epoch": 0.27, "learning_rate": 1.708450200002368e-05, "loss": 1.3457, "step": 9957 }, { "epoch": 0.27, "learning_rate": 1.7083877721801787e-05, "loss": 1.2798, "step": 9958 }, { "epoch": 0.27, "learning_rate": 1.708325338815896e-05, "loss": 1.2966, "step": 9959 }, { "epoch": 0.27, "learning_rate": 1.7082628999100096e-05, "loss": 1.3394, "step": 9960 }, { "epoch": 0.27, "learning_rate": 1.708200455463007e-05, "loss": 1.3242, "step": 9961 }, { "epoch": 0.27, "learning_rate": 1.7081380054753772e-05, "loss": 1.3296, "step": 9962 }, { "epoch": 0.27, "learning_rate": 1.7080755499476082e-05, "loss": 1.3367, "step": 9963 }, { "epoch": 0.27, "learning_rate": 1.7080130888801895e-05, "loss": 1.3247, "step": 9964 }, { "epoch": 0.27, "learning_rate": 1.707950622273609e-05, "loss": 1.4175, "step": 9965 }, { "epoch": 0.27, "learning_rate": 1.707888150128356e-05, "loss": 1.3267, "step": 9966 }, { "epoch": 0.27, "learning_rate": 1.7078256724449186e-05, "loss": 1.3662, "step": 9967 }, { "epoch": 0.27, "learning_rate": 1.7077631892237864e-05, "loss": 1.2444, "step": 9968 }, { "epoch": 0.27, "learning_rate": 1.707700700465448e-05, "loss": 1.3655, "step": 9969 }, { "epoch": 0.27, "learning_rate": 1.7076382061703916e-05, "loss": 1.1021, "step": 9970 }, { "epoch": 0.27, "learning_rate": 1.7075757063391067e-05, "loss": 1.3118, "step": 9971 }, { "epoch": 0.27, "learning_rate": 1.7075132009720824e-05, "loss": 1.3567, "step": 9972 }, { "epoch": 0.27, "learning_rate": 1.7074506900698072e-05, "loss": 1.4502, "step": 9973 }, { "epoch": 0.27, "learning_rate": 1.707388173632771e-05, "loss": 1.355, "step": 9974 }, { "epoch": 0.27, "learning_rate": 1.707325651661462e-05, "loss": 1.3008, "step": 9975 }, { "epoch": 0.27, "learning_rate": 1.7072631241563698e-05, "loss": 1.3835, "step": 9976 }, { "epoch": 0.27, "learning_rate": 1.7072005911179835e-05, "loss": 1.323, "step": 9977 }, { "epoch": 0.27, "learning_rate": 1.7071380525467923e-05, "loss": 1.3442, "step": 9978 }, { "epoch": 0.27, "learning_rate": 1.7070755084432854e-05, "loss": 1.2688, "step": 9979 }, { "epoch": 0.27, "learning_rate": 1.7070129588079522e-05, "loss": 1.3364, "step": 9980 }, { "epoch": 0.27, "learning_rate": 1.7069504036412822e-05, "loss": 1.3257, "step": 9981 }, { "epoch": 0.27, "learning_rate": 1.706887842943765e-05, "loss": 1.323, "step": 9982 }, { "epoch": 0.27, "learning_rate": 1.706825276715889e-05, "loss": 1.3416, "step": 9983 }, { "epoch": 0.27, "learning_rate": 1.706762704958145e-05, "loss": 1.4092, "step": 9984 }, { "epoch": 0.27, "learning_rate": 1.7067001276710214e-05, "loss": 1.3572, "step": 9985 }, { "epoch": 0.27, "learning_rate": 1.7066375448550087e-05, "loss": 1.3855, "step": 9986 }, { "epoch": 0.27, "learning_rate": 1.706574956510596e-05, "loss": 1.417, "step": 9987 }, { "epoch": 0.27, "learning_rate": 1.7065123626382735e-05, "loss": 1.3376, "step": 9988 }, { "epoch": 0.27, "learning_rate": 1.70644976323853e-05, "loss": 1.1973, "step": 9989 }, { "epoch": 0.27, "learning_rate": 1.706387158311856e-05, "loss": 1.2695, "step": 9990 }, { "epoch": 0.27, "learning_rate": 1.7063245478587408e-05, "loss": 1.3896, "step": 9991 }, { "epoch": 0.27, "learning_rate": 1.7062619318796747e-05, "loss": 1.4424, "step": 9992 }, { "epoch": 0.27, "learning_rate": 1.7061993103751474e-05, "loss": 1.332, "step": 9993 }, { "epoch": 0.27, "learning_rate": 1.7061366833456486e-05, "loss": 1.2979, "step": 9994 }, { "epoch": 0.27, "learning_rate": 1.7060740507916683e-05, "loss": 1.4258, "step": 9995 }, { "epoch": 0.27, "learning_rate": 1.706011412713697e-05, "loss": 1.3662, "step": 9996 }, { "epoch": 0.27, "learning_rate": 1.705948769112224e-05, "loss": 1.3728, "step": 9997 }, { "epoch": 0.27, "learning_rate": 1.70588611998774e-05, "loss": 1.3157, "step": 9998 }, { "epoch": 0.27, "learning_rate": 1.705823465340735e-05, "loss": 1.3223, "step": 9999 }, { "epoch": 0.27, "learning_rate": 1.705760805171699e-05, "loss": 1.2937, "step": 10000 }, { "epoch": 0.27, "learning_rate": 1.7056981394811222e-05, "loss": 1.3501, "step": 10001 }, { "epoch": 0.27, "learning_rate": 1.7056354682694955e-05, "loss": 1.1863, "step": 10002 }, { "epoch": 0.27, "learning_rate": 1.7055727915373084e-05, "loss": 1.4512, "step": 10003 }, { "epoch": 0.27, "learning_rate": 1.7055101092850513e-05, "loss": 1.3601, "step": 10004 }, { "epoch": 0.27, "learning_rate": 1.705447421513215e-05, "loss": 1.4153, "step": 10005 }, { "epoch": 0.27, "learning_rate": 1.7053847282222902e-05, "loss": 1.3262, "step": 10006 }, { "epoch": 0.27, "learning_rate": 1.7053220294127667e-05, "loss": 1.4294, "step": 10007 }, { "epoch": 0.27, "learning_rate": 1.7052593250851353e-05, "loss": 1.1455, "step": 10008 }, { "epoch": 0.27, "learning_rate": 1.7051966152398868e-05, "loss": 1.3777, "step": 10009 }, { "epoch": 0.27, "learning_rate": 1.705133899877511e-05, "loss": 1.166, "step": 10010 }, { "epoch": 0.27, "learning_rate": 1.7050711789984996e-05, "loss": 1.3315, "step": 10011 }, { "epoch": 0.27, "learning_rate": 1.7050084526033428e-05, "loss": 1.4128, "step": 10012 }, { "epoch": 0.27, "learning_rate": 1.7049457206925313e-05, "loss": 1.2117, "step": 10013 }, { "epoch": 0.27, "learning_rate": 1.704882983266556e-05, "loss": 1.4194, "step": 10014 }, { "epoch": 0.27, "learning_rate": 1.7048202403259077e-05, "loss": 1.3811, "step": 10015 }, { "epoch": 0.27, "learning_rate": 1.704757491871077e-05, "loss": 1.2412, "step": 10016 }, { "epoch": 0.27, "learning_rate": 1.7046947379025556e-05, "loss": 1.3762, "step": 10017 }, { "epoch": 0.27, "learning_rate": 1.704631978420834e-05, "loss": 1.3716, "step": 10018 }, { "epoch": 0.27, "learning_rate": 1.7045692134264026e-05, "loss": 1.4126, "step": 10019 }, { "epoch": 0.27, "learning_rate": 1.7045064429197532e-05, "loss": 1.4739, "step": 10020 }, { "epoch": 0.27, "learning_rate": 1.7044436669013768e-05, "loss": 1.1772, "step": 10021 }, { "epoch": 0.27, "learning_rate": 1.7043808853717643e-05, "loss": 1.4434, "step": 10022 }, { "epoch": 0.27, "learning_rate": 1.704318098331407e-05, "loss": 1.4285, "step": 10023 }, { "epoch": 0.27, "learning_rate": 1.7042553057807962e-05, "loss": 1.3203, "step": 10024 }, { "epoch": 0.27, "learning_rate": 1.7041925077204226e-05, "loss": 1.2754, "step": 10025 }, { "epoch": 0.27, "learning_rate": 1.7041297041507783e-05, "loss": 1.3616, "step": 10026 }, { "epoch": 0.27, "learning_rate": 1.7040668950723546e-05, "loss": 1.4011, "step": 10027 }, { "epoch": 0.27, "learning_rate": 1.704004080485642e-05, "loss": 1.3191, "step": 10028 }, { "epoch": 0.27, "learning_rate": 1.7039412603911328e-05, "loss": 1.4785, "step": 10029 }, { "epoch": 0.27, "learning_rate": 1.7038784347893182e-05, "loss": 1.2896, "step": 10030 }, { "epoch": 0.27, "learning_rate": 1.7038156036806897e-05, "loss": 1.4248, "step": 10031 }, { "epoch": 0.27, "learning_rate": 1.703752767065739e-05, "loss": 1.4038, "step": 10032 }, { "epoch": 0.27, "learning_rate": 1.7036899249449573e-05, "loss": 1.2917, "step": 10033 }, { "epoch": 0.27, "learning_rate": 1.7036270773188367e-05, "loss": 1.3586, "step": 10034 }, { "epoch": 0.27, "learning_rate": 1.703564224187869e-05, "loss": 1.2542, "step": 10035 }, { "epoch": 0.27, "learning_rate": 1.7035013655525453e-05, "loss": 1.4009, "step": 10036 }, { "epoch": 0.27, "learning_rate": 1.7034385014133575e-05, "loss": 1.499, "step": 10037 }, { "epoch": 0.27, "learning_rate": 1.703375631770798e-05, "loss": 1.3667, "step": 10038 }, { "epoch": 0.27, "learning_rate": 1.7033127566253582e-05, "loss": 1.3569, "step": 10039 }, { "epoch": 0.27, "learning_rate": 1.7032498759775304e-05, "loss": 1.4805, "step": 10040 }, { "epoch": 0.27, "learning_rate": 1.7031869898278058e-05, "loss": 1.3418, "step": 10041 }, { "epoch": 0.27, "learning_rate": 1.703124098176677e-05, "loss": 1.4089, "step": 10042 }, { "epoch": 0.27, "learning_rate": 1.703061201024636e-05, "loss": 1.3386, "step": 10043 }, { "epoch": 0.27, "learning_rate": 1.7029982983721746e-05, "loss": 1.3936, "step": 10044 }, { "epoch": 0.27, "learning_rate": 1.7029353902197853e-05, "loss": 1.4365, "step": 10045 }, { "epoch": 0.27, "learning_rate": 1.7028724765679597e-05, "loss": 1.4185, "step": 10046 }, { "epoch": 0.27, "learning_rate": 1.7028095574171905e-05, "loss": 1.3757, "step": 10047 }, { "epoch": 0.27, "learning_rate": 1.70274663276797e-05, "loss": 1.2917, "step": 10048 }, { "epoch": 0.27, "learning_rate": 1.7026837026207903e-05, "loss": 1.3301, "step": 10049 }, { "epoch": 0.27, "learning_rate": 1.7026207669761436e-05, "loss": 1.1704, "step": 10050 }, { "epoch": 0.27, "learning_rate": 1.7025578258345227e-05, "loss": 1.3513, "step": 10051 }, { "epoch": 0.27, "learning_rate": 1.7024948791964193e-05, "loss": 1.3984, "step": 10052 }, { "epoch": 0.27, "learning_rate": 1.7024319270623263e-05, "loss": 1.2761, "step": 10053 }, { "epoch": 0.27, "learning_rate": 1.702368969432737e-05, "loss": 1.394, "step": 10054 }, { "epoch": 0.27, "learning_rate": 1.7023060063081424e-05, "loss": 1.3965, "step": 10055 }, { "epoch": 0.27, "learning_rate": 1.7022430376890356e-05, "loss": 1.249, "step": 10056 }, { "epoch": 0.27, "learning_rate": 1.7021800635759102e-05, "loss": 1.4314, "step": 10057 }, { "epoch": 0.27, "learning_rate": 1.7021170839692577e-05, "loss": 1.4211, "step": 10058 }, { "epoch": 0.27, "learning_rate": 1.7020540988695715e-05, "loss": 1.2095, "step": 10059 }, { "epoch": 0.27, "learning_rate": 1.701991108277344e-05, "loss": 1.3433, "step": 10060 }, { "epoch": 0.27, "learning_rate": 1.7019281121930684e-05, "loss": 1.3274, "step": 10061 }, { "epoch": 0.27, "learning_rate": 1.701865110617237e-05, "loss": 1.3752, "step": 10062 }, { "epoch": 0.27, "learning_rate": 1.7018021035503433e-05, "loss": 1.3811, "step": 10063 }, { "epoch": 0.27, "learning_rate": 1.70173909099288e-05, "loss": 1.438, "step": 10064 }, { "epoch": 0.27, "learning_rate": 1.70167607294534e-05, "loss": 1.4719, "step": 10065 }, { "epoch": 0.27, "learning_rate": 1.7016130494082165e-05, "loss": 1.061, "step": 10066 }, { "epoch": 0.27, "learning_rate": 1.701550020382002e-05, "loss": 1.2332, "step": 10067 }, { "epoch": 0.27, "learning_rate": 1.7014869858671902e-05, "loss": 1.229, "step": 10068 }, { "epoch": 0.27, "learning_rate": 1.7014239458642744e-05, "loss": 1.3982, "step": 10069 }, { "epoch": 0.28, "learning_rate": 1.701360900373747e-05, "loss": 1.3809, "step": 10070 }, { "epoch": 0.28, "learning_rate": 1.701297849396102e-05, "loss": 1.3301, "step": 10071 }, { "epoch": 0.28, "learning_rate": 1.701234792931832e-05, "loss": 1.531, "step": 10072 }, { "epoch": 0.28, "learning_rate": 1.701171730981431e-05, "loss": 1.3362, "step": 10073 }, { "epoch": 0.28, "learning_rate": 1.701108663545392e-05, "loss": 1.3228, "step": 10074 }, { "epoch": 0.28, "learning_rate": 1.7010455906242088e-05, "loss": 1.3477, "step": 10075 }, { "epoch": 0.28, "learning_rate": 1.7009825122183743e-05, "loss": 1.324, "step": 10076 }, { "epoch": 0.28, "learning_rate": 1.7009194283283827e-05, "loss": 1.5239, "step": 10077 }, { "epoch": 0.28, "learning_rate": 1.7008563389547265e-05, "loss": 1.3914, "step": 10078 }, { "epoch": 0.28, "learning_rate": 1.7007932440979e-05, "loss": 1.2341, "step": 10079 }, { "epoch": 0.28, "learning_rate": 1.7007301437583968e-05, "loss": 1.3696, "step": 10080 }, { "epoch": 0.28, "learning_rate": 1.7006670379367106e-05, "loss": 1.3511, "step": 10081 }, { "epoch": 0.28, "learning_rate": 1.700603926633335e-05, "loss": 1.312, "step": 10082 }, { "epoch": 0.28, "learning_rate": 1.7005408098487635e-05, "loss": 1.3369, "step": 10083 }, { "epoch": 0.28, "learning_rate": 1.70047768758349e-05, "loss": 1.3193, "step": 10084 }, { "epoch": 0.28, "learning_rate": 1.7004145598380085e-05, "loss": 1.2217, "step": 10085 }, { "epoch": 0.28, "learning_rate": 1.7003514266128132e-05, "loss": 1.3442, "step": 10086 }, { "epoch": 0.28, "learning_rate": 1.7002882879083973e-05, "loss": 1.415, "step": 10087 }, { "epoch": 0.28, "learning_rate": 1.7002251437252554e-05, "loss": 1.3054, "step": 10088 }, { "epoch": 0.28, "learning_rate": 1.700161994063881e-05, "loss": 1.3813, "step": 10089 }, { "epoch": 0.28, "learning_rate": 1.7000988389247685e-05, "loss": 1.5449, "step": 10090 }, { "epoch": 0.28, "learning_rate": 1.700035678308412e-05, "loss": 1.2393, "step": 10091 }, { "epoch": 0.28, "learning_rate": 1.699972512215305e-05, "loss": 1.3665, "step": 10092 }, { "epoch": 0.28, "learning_rate": 1.699909340645943e-05, "loss": 1.2896, "step": 10093 }, { "epoch": 0.28, "learning_rate": 1.6998461636008193e-05, "loss": 1.491, "step": 10094 }, { "epoch": 0.28, "learning_rate": 1.6997829810804282e-05, "loss": 1.5645, "step": 10095 }, { "epoch": 0.28, "learning_rate": 1.6997197930852636e-05, "loss": 1.2869, "step": 10096 }, { "epoch": 0.28, "learning_rate": 1.699656599615821e-05, "loss": 1.3784, "step": 10097 }, { "epoch": 0.28, "learning_rate": 1.699593400672594e-05, "loss": 1.4436, "step": 10098 }, { "epoch": 0.28, "learning_rate": 1.699530196256077e-05, "loss": 1.1997, "step": 10099 }, { "epoch": 0.28, "learning_rate": 1.699466986366765e-05, "loss": 1.3892, "step": 10100 }, { "epoch": 0.28, "learning_rate": 1.699403771005152e-05, "loss": 1.3093, "step": 10101 }, { "epoch": 0.28, "learning_rate": 1.699340550171733e-05, "loss": 1.2969, "step": 10102 }, { "epoch": 0.28, "learning_rate": 1.699277323867002e-05, "loss": 1.2173, "step": 10103 }, { "epoch": 0.28, "learning_rate": 1.699214092091454e-05, "loss": 1.4795, "step": 10104 }, { "epoch": 0.28, "learning_rate": 1.6991508548455843e-05, "loss": 1.2517, "step": 10105 }, { "epoch": 0.28, "learning_rate": 1.6990876121298867e-05, "loss": 1.2473, "step": 10106 }, { "epoch": 0.28, "learning_rate": 1.6990243639448563e-05, "loss": 1.4429, "step": 10107 }, { "epoch": 0.28, "learning_rate": 1.6989611102909883e-05, "loss": 1.8262, "step": 10108 }, { "epoch": 0.28, "learning_rate": 1.698897851168777e-05, "loss": 1.3083, "step": 10109 }, { "epoch": 0.28, "learning_rate": 1.6988345865787176e-05, "loss": 1.2634, "step": 10110 }, { "epoch": 0.28, "learning_rate": 1.698771316521305e-05, "loss": 1.4058, "step": 10111 }, { "epoch": 0.28, "learning_rate": 1.6987080409970344e-05, "loss": 1.4526, "step": 10112 }, { "epoch": 0.28, "learning_rate": 1.6986447600064004e-05, "loss": 1.2246, "step": 10113 }, { "epoch": 0.28, "learning_rate": 1.6985814735498984e-05, "loss": 1.478, "step": 10114 }, { "epoch": 0.28, "learning_rate": 1.6985181816280233e-05, "loss": 1.1558, "step": 10115 }, { "epoch": 0.28, "learning_rate": 1.6984548842412705e-05, "loss": 1.2656, "step": 10116 }, { "epoch": 0.28, "learning_rate": 1.698391581390135e-05, "loss": 1.4412, "step": 10117 }, { "epoch": 0.28, "learning_rate": 1.6983282730751127e-05, "loss": 1.4023, "step": 10118 }, { "epoch": 0.28, "learning_rate": 1.698264959296698e-05, "loss": 1.3804, "step": 10119 }, { "epoch": 0.28, "learning_rate": 1.6982016400553866e-05, "loss": 1.2847, "step": 10120 }, { "epoch": 0.28, "learning_rate": 1.698138315351674e-05, "loss": 1.2227, "step": 10121 }, { "epoch": 0.28, "learning_rate": 1.6980749851860553e-05, "loss": 1.2996, "step": 10122 }, { "epoch": 0.28, "learning_rate": 1.6980116495590264e-05, "loss": 1.2615, "step": 10123 }, { "epoch": 0.28, "learning_rate": 1.6979483084710822e-05, "loss": 1.6133, "step": 10124 }, { "epoch": 0.28, "learning_rate": 1.697884961922719e-05, "loss": 1.4028, "step": 10125 }, { "epoch": 0.28, "learning_rate": 1.6978216099144322e-05, "loss": 1.175, "step": 10126 }, { "epoch": 0.28, "learning_rate": 1.697758252446717e-05, "loss": 1.4895, "step": 10127 }, { "epoch": 0.28, "learning_rate": 1.697694889520069e-05, "loss": 1.3142, "step": 10128 }, { "epoch": 0.28, "learning_rate": 1.6976315211349848e-05, "loss": 1.2102, "step": 10129 }, { "epoch": 0.28, "learning_rate": 1.6975681472919598e-05, "loss": 1.2576, "step": 10130 }, { "epoch": 0.28, "learning_rate": 1.697504767991489e-05, "loss": 1.1265, "step": 10131 }, { "epoch": 0.28, "learning_rate": 1.697441383234069e-05, "loss": 1.1492, "step": 10132 }, { "epoch": 0.28, "learning_rate": 1.697377993020196e-05, "loss": 1.3691, "step": 10133 }, { "epoch": 0.28, "learning_rate": 1.697314597350365e-05, "loss": 1.1411, "step": 10134 }, { "epoch": 0.28, "learning_rate": 1.697251196225073e-05, "loss": 1.2786, "step": 10135 }, { "epoch": 0.28, "learning_rate": 1.697187789644815e-05, "loss": 1.6938, "step": 10136 }, { "epoch": 0.28, "learning_rate": 1.697124377610088e-05, "loss": 1.301, "step": 10137 }, { "epoch": 0.28, "learning_rate": 1.6970609601213873e-05, "loss": 1.3091, "step": 10138 }, { "epoch": 0.28, "learning_rate": 1.69699753717921e-05, "loss": 1.2458, "step": 10139 }, { "epoch": 0.28, "learning_rate": 1.696934108784051e-05, "loss": 1.3767, "step": 10140 }, { "epoch": 0.28, "learning_rate": 1.6968706749364077e-05, "loss": 1.3857, "step": 10141 }, { "epoch": 0.28, "learning_rate": 1.696807235636776e-05, "loss": 1.4238, "step": 10142 }, { "epoch": 0.28, "learning_rate": 1.6967437908856517e-05, "loss": 1.3252, "step": 10143 }, { "epoch": 0.28, "learning_rate": 1.6966803406835318e-05, "loss": 1.415, "step": 10144 }, { "epoch": 0.28, "learning_rate": 1.6966168850309128e-05, "loss": 1.3003, "step": 10145 }, { "epoch": 0.28, "learning_rate": 1.696553423928291e-05, "loss": 1.2175, "step": 10146 }, { "epoch": 0.28, "learning_rate": 1.696489957376162e-05, "loss": 1.354, "step": 10147 }, { "epoch": 0.28, "learning_rate": 1.6964264853750235e-05, "loss": 1.1887, "step": 10148 }, { "epoch": 0.28, "learning_rate": 1.696363007925372e-05, "loss": 1.7969, "step": 10149 }, { "epoch": 0.28, "learning_rate": 1.6962995250277033e-05, "loss": 1.291, "step": 10150 }, { "epoch": 0.28, "learning_rate": 1.6962360366825147e-05, "loss": 1.3496, "step": 10151 }, { "epoch": 0.28, "learning_rate": 1.696172542890303e-05, "loss": 1.2041, "step": 10152 }, { "epoch": 0.28, "learning_rate": 1.6961090436515643e-05, "loss": 1.1428, "step": 10153 }, { "epoch": 0.28, "learning_rate": 1.6960455389667958e-05, "loss": 1.2322, "step": 10154 }, { "epoch": 0.28, "learning_rate": 1.6959820288364945e-05, "loss": 1.4175, "step": 10155 }, { "epoch": 0.28, "learning_rate": 1.6959185132611567e-05, "loss": 1.4326, "step": 10156 }, { "epoch": 0.28, "learning_rate": 1.6958549922412802e-05, "loss": 1.3564, "step": 10157 }, { "epoch": 0.28, "learning_rate": 1.695791465777361e-05, "loss": 1.4587, "step": 10158 }, { "epoch": 0.28, "learning_rate": 1.6957279338698972e-05, "loss": 1.8267, "step": 10159 }, { "epoch": 0.28, "learning_rate": 1.6956643965193847e-05, "loss": 1.4292, "step": 10160 }, { "epoch": 0.28, "learning_rate": 1.695600853726321e-05, "loss": 1.269, "step": 10161 }, { "epoch": 0.28, "learning_rate": 1.6955373054912038e-05, "loss": 1.2983, "step": 10162 }, { "epoch": 0.28, "learning_rate": 1.6954737518145294e-05, "loss": 1.3232, "step": 10163 }, { "epoch": 0.28, "learning_rate": 1.6954101926967955e-05, "loss": 1.4341, "step": 10164 }, { "epoch": 0.28, "learning_rate": 1.695346628138499e-05, "loss": 1.2798, "step": 10165 }, { "epoch": 0.28, "learning_rate": 1.6952830581401375e-05, "loss": 1.2881, "step": 10166 }, { "epoch": 0.28, "learning_rate": 1.695219482702209e-05, "loss": 1.3105, "step": 10167 }, { "epoch": 0.28, "learning_rate": 1.6951559018252096e-05, "loss": 1.3621, "step": 10168 }, { "epoch": 0.28, "learning_rate": 1.695092315509637e-05, "loss": 1.394, "step": 10169 }, { "epoch": 0.28, "learning_rate": 1.6950287237559898e-05, "loss": 1.3892, "step": 10170 }, { "epoch": 0.28, "learning_rate": 1.694965126564764e-05, "loss": 1.2043, "step": 10171 }, { "epoch": 0.28, "learning_rate": 1.694901523936458e-05, "loss": 1.3162, "step": 10172 }, { "epoch": 0.28, "learning_rate": 1.6948379158715696e-05, "loss": 1.4075, "step": 10173 }, { "epoch": 0.28, "learning_rate": 1.6947743023705956e-05, "loss": 1.283, "step": 10174 }, { "epoch": 0.28, "learning_rate": 1.6947106834340347e-05, "loss": 0.9939, "step": 10175 }, { "epoch": 0.28, "learning_rate": 1.694647059062384e-05, "loss": 1.3362, "step": 10176 }, { "epoch": 0.28, "learning_rate": 1.6945834292561408e-05, "loss": 1.4324, "step": 10177 }, { "epoch": 0.28, "learning_rate": 1.694519794015804e-05, "loss": 1.3235, "step": 10178 }, { "epoch": 0.28, "learning_rate": 1.6944561533418707e-05, "loss": 1.1147, "step": 10179 }, { "epoch": 0.28, "learning_rate": 1.6943925072348388e-05, "loss": 1.4739, "step": 10180 }, { "epoch": 0.28, "learning_rate": 1.694328855695207e-05, "loss": 1.3096, "step": 10181 }, { "epoch": 0.28, "learning_rate": 1.694265198723472e-05, "loss": 1.3765, "step": 10182 }, { "epoch": 0.28, "learning_rate": 1.694201536320133e-05, "loss": 1.3608, "step": 10183 }, { "epoch": 0.28, "learning_rate": 1.694137868485688e-05, "loss": 1.3479, "step": 10184 }, { "epoch": 0.28, "learning_rate": 1.6940741952206342e-05, "loss": 1.2622, "step": 10185 }, { "epoch": 0.28, "learning_rate": 1.6940105165254703e-05, "loss": 1.3696, "step": 10186 }, { "epoch": 0.28, "learning_rate": 1.6939468324006943e-05, "loss": 1.3879, "step": 10187 }, { "epoch": 0.28, "learning_rate": 1.693883142846805e-05, "loss": 1.1277, "step": 10188 }, { "epoch": 0.28, "learning_rate": 1.6938194478643e-05, "loss": 1.2971, "step": 10189 }, { "epoch": 0.28, "learning_rate": 1.6937557474536783e-05, "loss": 1.47, "step": 10190 }, { "epoch": 0.28, "learning_rate": 1.6936920416154373e-05, "loss": 1.2932, "step": 10191 }, { "epoch": 0.28, "learning_rate": 1.693628330350076e-05, "loss": 1.415, "step": 10192 }, { "epoch": 0.28, "learning_rate": 1.6935646136580936e-05, "loss": 1.2378, "step": 10193 }, { "epoch": 0.28, "learning_rate": 1.693500891539987e-05, "loss": 1.2856, "step": 10194 }, { "epoch": 0.28, "learning_rate": 1.693437163996256e-05, "loss": 1.397, "step": 10195 }, { "epoch": 0.28, "learning_rate": 1.6933734310273982e-05, "loss": 1.2605, "step": 10196 }, { "epoch": 0.28, "learning_rate": 1.6933096926339132e-05, "loss": 1.4395, "step": 10197 }, { "epoch": 0.28, "learning_rate": 1.693245948816299e-05, "loss": 1.4329, "step": 10198 }, { "epoch": 0.28, "learning_rate": 1.6931821995750544e-05, "loss": 1.4595, "step": 10199 }, { "epoch": 0.28, "learning_rate": 1.6931184449106783e-05, "loss": 1.3311, "step": 10200 }, { "epoch": 0.28, "learning_rate": 1.6930546848236695e-05, "loss": 1.4224, "step": 10201 }, { "epoch": 0.28, "learning_rate": 1.6929909193145267e-05, "loss": 1.3926, "step": 10202 }, { "epoch": 0.28, "learning_rate": 1.6929271483837486e-05, "loss": 1.4561, "step": 10203 }, { "epoch": 0.28, "learning_rate": 1.6928633720318346e-05, "loss": 1.3213, "step": 10204 }, { "epoch": 0.28, "learning_rate": 1.6927995902592834e-05, "loss": 1.3865, "step": 10205 }, { "epoch": 0.28, "learning_rate": 1.692735803066594e-05, "loss": 1.2626, "step": 10206 }, { "epoch": 0.28, "learning_rate": 1.6926720104542653e-05, "loss": 1.2065, "step": 10207 }, { "epoch": 0.28, "learning_rate": 1.6926082124227964e-05, "loss": 1.4031, "step": 10208 }, { "epoch": 0.28, "learning_rate": 1.6925444089726867e-05, "loss": 1.1187, "step": 10209 }, { "epoch": 0.28, "learning_rate": 1.692480600104435e-05, "loss": 1.4958, "step": 10210 }, { "epoch": 0.28, "learning_rate": 1.6924167858185406e-05, "loss": 1.304, "step": 10211 }, { "epoch": 0.28, "learning_rate": 1.692352966115503e-05, "loss": 1.425, "step": 10212 }, { "epoch": 0.28, "learning_rate": 1.6922891409958216e-05, "loss": 1.3486, "step": 10213 }, { "epoch": 0.28, "learning_rate": 1.6922253104599953e-05, "loss": 1.3142, "step": 10214 }, { "epoch": 0.28, "learning_rate": 1.6921614745085236e-05, "loss": 1.2314, "step": 10215 }, { "epoch": 0.28, "learning_rate": 1.6920976331419066e-05, "loss": 1.4856, "step": 10216 }, { "epoch": 0.28, "learning_rate": 1.6920337863606427e-05, "loss": 1.3518, "step": 10217 }, { "epoch": 0.28, "learning_rate": 1.691969934165232e-05, "loss": 1.4141, "step": 10218 }, { "epoch": 0.28, "learning_rate": 1.6919060765561736e-05, "loss": 1.4241, "step": 10219 }, { "epoch": 0.28, "learning_rate": 1.6918422135339677e-05, "loss": 1.3354, "step": 10220 }, { "epoch": 0.28, "learning_rate": 1.6917783450991135e-05, "loss": 1.3613, "step": 10221 }, { "epoch": 0.28, "learning_rate": 1.6917144712521108e-05, "loss": 1.4604, "step": 10222 }, { "epoch": 0.28, "learning_rate": 1.6916505919934596e-05, "loss": 1.2708, "step": 10223 }, { "epoch": 0.28, "learning_rate": 1.6915867073236595e-05, "loss": 1.3535, "step": 10224 }, { "epoch": 0.28, "learning_rate": 1.6915228172432096e-05, "loss": 1.2275, "step": 10225 }, { "epoch": 0.28, "learning_rate": 1.6914589217526107e-05, "loss": 1.283, "step": 10226 }, { "epoch": 0.28, "learning_rate": 1.6913950208523626e-05, "loss": 1.2659, "step": 10227 }, { "epoch": 0.28, "learning_rate": 1.6913311145429644e-05, "loss": 1.3047, "step": 10228 }, { "epoch": 0.28, "learning_rate": 1.691267202824917e-05, "loss": 1.3779, "step": 10229 }, { "epoch": 0.28, "learning_rate": 1.69120328569872e-05, "loss": 1.333, "step": 10230 }, { "epoch": 0.28, "learning_rate": 1.6911393631648735e-05, "loss": 1.4092, "step": 10231 }, { "epoch": 0.28, "learning_rate": 1.6910754352238778e-05, "loss": 1.3035, "step": 10232 }, { "epoch": 0.28, "learning_rate": 1.691011501876233e-05, "loss": 1.2607, "step": 10233 }, { "epoch": 0.28, "learning_rate": 1.6909475631224385e-05, "loss": 1.3303, "step": 10234 }, { "epoch": 0.28, "learning_rate": 1.6908836189629957e-05, "loss": 1.3389, "step": 10235 }, { "epoch": 0.28, "learning_rate": 1.6908196693984042e-05, "loss": 1.2432, "step": 10236 }, { "epoch": 0.28, "learning_rate": 1.6907557144291645e-05, "loss": 1.312, "step": 10237 }, { "epoch": 0.28, "learning_rate": 1.6906917540557767e-05, "loss": 1.3618, "step": 10238 }, { "epoch": 0.28, "learning_rate": 1.6906277882787416e-05, "loss": 1.281, "step": 10239 }, { "epoch": 0.28, "learning_rate": 1.6905638170985598e-05, "loss": 1.4321, "step": 10240 }, { "epoch": 0.28, "learning_rate": 1.690499840515731e-05, "loss": 1.3403, "step": 10241 }, { "epoch": 0.28, "learning_rate": 1.6904358585307558e-05, "loss": 1.292, "step": 10242 }, { "epoch": 0.28, "learning_rate": 1.6903718711441354e-05, "loss": 1.3372, "step": 10243 }, { "epoch": 0.28, "learning_rate": 1.6903078783563702e-05, "loss": 1.3418, "step": 10244 }, { "epoch": 0.28, "learning_rate": 1.690243880167961e-05, "loss": 1.2881, "step": 10245 }, { "epoch": 0.28, "learning_rate": 1.690179876579408e-05, "loss": 1.4202, "step": 10246 }, { "epoch": 0.28, "learning_rate": 1.690115867591212e-05, "loss": 1.4248, "step": 10247 }, { "epoch": 0.28, "learning_rate": 1.6900518532038743e-05, "loss": 1.2002, "step": 10248 }, { "epoch": 0.28, "learning_rate": 1.689987833417895e-05, "loss": 1.3857, "step": 10249 }, { "epoch": 0.28, "learning_rate": 1.689923808233776e-05, "loss": 1.285, "step": 10250 }, { "epoch": 0.28, "learning_rate": 1.6898597776520168e-05, "loss": 1.498, "step": 10251 }, { "epoch": 0.28, "learning_rate": 1.6897957416731196e-05, "loss": 1.3516, "step": 10252 }, { "epoch": 0.28, "learning_rate": 1.689731700297585e-05, "loss": 1.2937, "step": 10253 }, { "epoch": 0.28, "learning_rate": 1.6896676535259135e-05, "loss": 1.3462, "step": 10254 }, { "epoch": 0.28, "learning_rate": 1.6896036013586067e-05, "loss": 1.2944, "step": 10255 }, { "epoch": 0.28, "learning_rate": 1.6895395437961655e-05, "loss": 1.3574, "step": 10256 }, { "epoch": 0.28, "learning_rate": 1.6894754808390915e-05, "loss": 1.1111, "step": 10257 }, { "epoch": 0.28, "learning_rate": 1.689411412487885e-05, "loss": 1.3198, "step": 10258 }, { "epoch": 0.28, "learning_rate": 1.689347338743048e-05, "loss": 1.1199, "step": 10259 }, { "epoch": 0.28, "learning_rate": 1.689283259605082e-05, "loss": 1.3657, "step": 10260 }, { "epoch": 0.28, "learning_rate": 1.6892191750744874e-05, "loss": 1.3408, "step": 10261 }, { "epoch": 0.28, "learning_rate": 1.6891550851517664e-05, "loss": 1.4094, "step": 10262 }, { "epoch": 0.28, "learning_rate": 1.68909098983742e-05, "loss": 1.3335, "step": 10263 }, { "epoch": 0.28, "learning_rate": 1.6890268891319498e-05, "loss": 1.3618, "step": 10264 }, { "epoch": 0.28, "learning_rate": 1.6889627830358567e-05, "loss": 1.3379, "step": 10265 }, { "epoch": 0.28, "learning_rate": 1.6888986715496434e-05, "loss": 1.2905, "step": 10266 }, { "epoch": 0.28, "learning_rate": 1.6888345546738106e-05, "loss": 1.2417, "step": 10267 }, { "epoch": 0.28, "learning_rate": 1.6887704324088604e-05, "loss": 1.3892, "step": 10268 }, { "epoch": 0.28, "learning_rate": 1.688706304755294e-05, "loss": 1.4495, "step": 10269 }, { "epoch": 0.28, "learning_rate": 1.688642171713613e-05, "loss": 1.2964, "step": 10270 }, { "epoch": 0.28, "learning_rate": 1.6885780332843198e-05, "loss": 1.4336, "step": 10271 }, { "epoch": 0.28, "learning_rate": 1.688513889467916e-05, "loss": 1.4087, "step": 10272 }, { "epoch": 0.28, "learning_rate": 1.688449740264903e-05, "loss": 1.2944, "step": 10273 }, { "epoch": 0.28, "learning_rate": 1.688385585675783e-05, "loss": 1.1659, "step": 10274 }, { "epoch": 0.28, "learning_rate": 1.688321425701058e-05, "loss": 1.3757, "step": 10275 }, { "epoch": 0.28, "learning_rate": 1.6882572603412296e-05, "loss": 1.26, "step": 10276 }, { "epoch": 0.28, "learning_rate": 1.6881930895968003e-05, "loss": 1.3838, "step": 10277 }, { "epoch": 0.28, "learning_rate": 1.6881289134682718e-05, "loss": 1.3416, "step": 10278 }, { "epoch": 0.28, "learning_rate": 1.6880647319561463e-05, "loss": 1.3882, "step": 10279 }, { "epoch": 0.28, "learning_rate": 1.6880005450609257e-05, "loss": 1.4028, "step": 10280 }, { "epoch": 0.28, "learning_rate": 1.6879363527831127e-05, "loss": 1.2407, "step": 10281 }, { "epoch": 0.28, "learning_rate": 1.687872155123209e-05, "loss": 1.3691, "step": 10282 }, { "epoch": 0.28, "learning_rate": 1.687807952081717e-05, "loss": 1.5181, "step": 10283 }, { "epoch": 0.28, "learning_rate": 1.687743743659139e-05, "loss": 1.3328, "step": 10284 }, { "epoch": 0.28, "learning_rate": 1.687679529855977e-05, "loss": 1.3579, "step": 10285 }, { "epoch": 0.28, "learning_rate": 1.6876153106727345e-05, "loss": 1.3477, "step": 10286 }, { "epoch": 0.28, "learning_rate": 1.6875510861099127e-05, "loss": 1.1934, "step": 10287 }, { "epoch": 0.28, "learning_rate": 1.6874868561680144e-05, "loss": 1.3379, "step": 10288 }, { "epoch": 0.28, "learning_rate": 1.6874226208475425e-05, "loss": 1.4324, "step": 10289 }, { "epoch": 0.28, "learning_rate": 1.687358380148999e-05, "loss": 1.4341, "step": 10290 }, { "epoch": 0.28, "learning_rate": 1.6872941340728867e-05, "loss": 1.2693, "step": 10291 }, { "epoch": 0.28, "learning_rate": 1.6872298826197088e-05, "loss": 1.3872, "step": 10292 }, { "epoch": 0.28, "learning_rate": 1.6871656257899668e-05, "loss": 1.3982, "step": 10293 }, { "epoch": 0.28, "learning_rate": 1.6871013635841644e-05, "loss": 1.3259, "step": 10294 }, { "epoch": 0.28, "learning_rate": 1.6870370960028042e-05, "loss": 1.1597, "step": 10295 }, { "epoch": 0.28, "learning_rate": 1.6869728230463887e-05, "loss": 1.3879, "step": 10296 }, { "epoch": 0.28, "learning_rate": 1.686908544715421e-05, "loss": 1.3638, "step": 10297 }, { "epoch": 0.28, "learning_rate": 1.6868442610104033e-05, "loss": 1.3757, "step": 10298 }, { "epoch": 0.28, "learning_rate": 1.6867799719318395e-05, "loss": 1.323, "step": 10299 }, { "epoch": 0.28, "learning_rate": 1.686715677480232e-05, "loss": 1.71, "step": 10300 }, { "epoch": 0.28, "learning_rate": 1.6866513776560844e-05, "loss": 1.5083, "step": 10301 }, { "epoch": 0.28, "learning_rate": 1.686587072459899e-05, "loss": 1.4331, "step": 10302 }, { "epoch": 0.28, "learning_rate": 1.686522761892179e-05, "loss": 1.3413, "step": 10303 }, { "epoch": 0.28, "learning_rate": 1.6864584459534277e-05, "loss": 1.4031, "step": 10304 }, { "epoch": 0.28, "learning_rate": 1.6863941246441483e-05, "loss": 1.4602, "step": 10305 }, { "epoch": 0.28, "learning_rate": 1.6863297979648444e-05, "loss": 1.4453, "step": 10306 }, { "epoch": 0.28, "learning_rate": 1.686265465916019e-05, "loss": 1.3689, "step": 10307 }, { "epoch": 0.28, "learning_rate": 1.686201128498175e-05, "loss": 1.3596, "step": 10308 }, { "epoch": 0.28, "learning_rate": 1.686136785711816e-05, "loss": 1.2595, "step": 10309 }, { "epoch": 0.28, "learning_rate": 1.6860724375574455e-05, "loss": 1.3721, "step": 10310 }, { "epoch": 0.28, "learning_rate": 1.6860080840355668e-05, "loss": 1.2378, "step": 10311 }, { "epoch": 0.28, "learning_rate": 1.6859437251466838e-05, "loss": 1.5161, "step": 10312 }, { "epoch": 0.28, "learning_rate": 1.685879360891299e-05, "loss": 1.271, "step": 10313 }, { "epoch": 0.28, "learning_rate": 1.685814991269917e-05, "loss": 1.3792, "step": 10314 }, { "epoch": 0.28, "learning_rate": 1.6857506162830414e-05, "loss": 1.4009, "step": 10315 }, { "epoch": 0.28, "learning_rate": 1.6856862359311746e-05, "loss": 1.4578, "step": 10316 }, { "epoch": 0.28, "learning_rate": 1.6856218502148215e-05, "loss": 1.3418, "step": 10317 }, { "epoch": 0.28, "learning_rate": 1.6855574591344855e-05, "loss": 1.4717, "step": 10318 }, { "epoch": 0.28, "learning_rate": 1.6854930626906705e-05, "loss": 1.4858, "step": 10319 }, { "epoch": 0.28, "learning_rate": 1.6854286608838796e-05, "loss": 1.2703, "step": 10320 }, { "epoch": 0.28, "learning_rate": 1.6853642537146176e-05, "loss": 1.2354, "step": 10321 }, { "epoch": 0.28, "learning_rate": 1.6852998411833877e-05, "loss": 1.157, "step": 10322 }, { "epoch": 0.28, "learning_rate": 1.685235423290694e-05, "loss": 1.3677, "step": 10323 }, { "epoch": 0.28, "learning_rate": 1.685171000037041e-05, "loss": 1.2158, "step": 10324 }, { "epoch": 0.28, "learning_rate": 1.685106571422932e-05, "loss": 1.282, "step": 10325 }, { "epoch": 0.28, "learning_rate": 1.6850421374488717e-05, "loss": 1.3333, "step": 10326 }, { "epoch": 0.28, "learning_rate": 1.6849776981153635e-05, "loss": 1.2388, "step": 10327 }, { "epoch": 0.28, "learning_rate": 1.684913253422912e-05, "loss": 1.3367, "step": 10328 }, { "epoch": 0.28, "learning_rate": 1.6848488033720212e-05, "loss": 1.4614, "step": 10329 }, { "epoch": 0.28, "learning_rate": 1.6847843479631955e-05, "loss": 1.282, "step": 10330 }, { "epoch": 0.28, "learning_rate": 1.684719887196939e-05, "loss": 1.3369, "step": 10331 }, { "epoch": 0.28, "learning_rate": 1.6846554210737562e-05, "loss": 1.3613, "step": 10332 }, { "epoch": 0.28, "learning_rate": 1.684590949594151e-05, "loss": 1.3552, "step": 10333 }, { "epoch": 0.28, "learning_rate": 1.6845264727586287e-05, "loss": 1.2751, "step": 10334 }, { "epoch": 0.28, "learning_rate": 1.6844619905676928e-05, "loss": 1.5093, "step": 10335 }, { "epoch": 0.28, "learning_rate": 1.6843975030218478e-05, "loss": 1.2434, "step": 10336 }, { "epoch": 0.28, "learning_rate": 1.684333010121599e-05, "loss": 1.5149, "step": 10337 }, { "epoch": 0.28, "learning_rate": 1.6842685118674506e-05, "loss": 1.446, "step": 10338 }, { "epoch": 0.28, "learning_rate": 1.684204008259907e-05, "loss": 1.4111, "step": 10339 }, { "epoch": 0.28, "learning_rate": 1.6841394992994727e-05, "loss": 1.3816, "step": 10340 }, { "epoch": 0.28, "learning_rate": 1.684074984986653e-05, "loss": 1.3264, "step": 10341 }, { "epoch": 0.28, "learning_rate": 1.6840104653219523e-05, "loss": 1.4141, "step": 10342 }, { "epoch": 0.28, "learning_rate": 1.6839459403058752e-05, "loss": 1.4932, "step": 10343 }, { "epoch": 0.28, "learning_rate": 1.6838814099389268e-05, "loss": 1.3052, "step": 10344 }, { "epoch": 0.28, "learning_rate": 1.6838168742216117e-05, "loss": 1.2917, "step": 10345 }, { "epoch": 0.28, "learning_rate": 1.683752333154435e-05, "loss": 1.4365, "step": 10346 }, { "epoch": 0.28, "learning_rate": 1.6836877867379016e-05, "loss": 1.3088, "step": 10347 }, { "epoch": 0.28, "learning_rate": 1.6836232349725163e-05, "loss": 1.3774, "step": 10348 }, { "epoch": 0.28, "learning_rate": 1.6835586778587844e-05, "loss": 1.4209, "step": 10349 }, { "epoch": 0.28, "learning_rate": 1.683494115397211e-05, "loss": 1.3611, "step": 10350 }, { "epoch": 0.28, "learning_rate": 1.6834295475883007e-05, "loss": 1.2524, "step": 10351 }, { "epoch": 0.28, "learning_rate": 1.6833649744325593e-05, "loss": 1.3862, "step": 10352 }, { "epoch": 0.28, "learning_rate": 1.6833003959304916e-05, "loss": 1.2932, "step": 10353 }, { "epoch": 0.28, "learning_rate": 1.6832358120826028e-05, "loss": 1.3533, "step": 10354 }, { "epoch": 0.28, "learning_rate": 1.6831712228893984e-05, "loss": 1.4011, "step": 10355 }, { "epoch": 0.28, "learning_rate": 1.6831066283513836e-05, "loss": 1.1648, "step": 10356 }, { "epoch": 0.28, "learning_rate": 1.6830420284690635e-05, "loss": 1.4705, "step": 10357 }, { "epoch": 0.28, "learning_rate": 1.682977423242944e-05, "loss": 1.3296, "step": 10358 }, { "epoch": 0.28, "learning_rate": 1.6829128126735303e-05, "loss": 1.4368, "step": 10359 }, { "epoch": 0.28, "learning_rate": 1.6828481967613276e-05, "loss": 1.3918, "step": 10360 }, { "epoch": 0.28, "learning_rate": 1.682783575506842e-05, "loss": 1.4771, "step": 10361 }, { "epoch": 0.28, "learning_rate": 1.682718948910579e-05, "loss": 1.416, "step": 10362 }, { "epoch": 0.28, "learning_rate": 1.6826543169730437e-05, "loss": 1.4922, "step": 10363 }, { "epoch": 0.28, "learning_rate": 1.682589679694742e-05, "loss": 1.3442, "step": 10364 }, { "epoch": 0.28, "learning_rate": 1.6825250370761798e-05, "loss": 1.2368, "step": 10365 }, { "epoch": 0.28, "learning_rate": 1.6824603891178624e-05, "loss": 1.2156, "step": 10366 }, { "epoch": 0.28, "learning_rate": 1.6823957358202955e-05, "loss": 1.4858, "step": 10367 }, { "epoch": 0.28, "learning_rate": 1.682331077183986e-05, "loss": 1.1843, "step": 10368 }, { "epoch": 0.28, "learning_rate": 1.6822664132094387e-05, "loss": 1.2595, "step": 10369 }, { "epoch": 0.28, "learning_rate": 1.6822017438971595e-05, "loss": 1.343, "step": 10370 }, { "epoch": 0.28, "learning_rate": 1.6821370692476552e-05, "loss": 1.3425, "step": 10371 }, { "epoch": 0.28, "learning_rate": 1.682072389261431e-05, "loss": 1.1799, "step": 10372 }, { "epoch": 0.28, "learning_rate": 1.682007703938993e-05, "loss": 1.2993, "step": 10373 }, { "epoch": 0.28, "learning_rate": 1.6819430132808477e-05, "loss": 1.2822, "step": 10374 }, { "epoch": 0.28, "learning_rate": 1.681878317287501e-05, "loss": 1.3464, "step": 10375 }, { "epoch": 0.28, "learning_rate": 1.6818136159594586e-05, "loss": 1.3096, "step": 10376 }, { "epoch": 0.28, "learning_rate": 1.6817489092972274e-05, "loss": 1.3379, "step": 10377 }, { "epoch": 0.28, "learning_rate": 1.681684197301313e-05, "loss": 1.3105, "step": 10378 }, { "epoch": 0.28, "learning_rate": 1.6816194799722224e-05, "loss": 1.301, "step": 10379 }, { "epoch": 0.28, "learning_rate": 1.681554757310461e-05, "loss": 1.4731, "step": 10380 }, { "epoch": 0.28, "learning_rate": 1.681490029316536e-05, "loss": 1.332, "step": 10381 }, { "epoch": 0.28, "learning_rate": 1.6814252959909535e-05, "loss": 1.3662, "step": 10382 }, { "epoch": 0.28, "learning_rate": 1.6813605573342197e-05, "loss": 1.4114, "step": 10383 }, { "epoch": 0.28, "learning_rate": 1.6812958133468416e-05, "loss": 1.3198, "step": 10384 }, { "epoch": 0.28, "learning_rate": 1.681231064029325e-05, "loss": 1.3945, "step": 10385 }, { "epoch": 0.28, "learning_rate": 1.6811663093821776e-05, "loss": 1.2751, "step": 10386 }, { "epoch": 0.28, "learning_rate": 1.6811015494059048e-05, "loss": 1.3086, "step": 10387 }, { "epoch": 0.28, "learning_rate": 1.6810367841010137e-05, "loss": 1.2595, "step": 10388 }, { "epoch": 0.28, "learning_rate": 1.680972013468011e-05, "loss": 1.4536, "step": 10389 }, { "epoch": 0.28, "learning_rate": 1.6809072375074037e-05, "loss": 1.3633, "step": 10390 }, { "epoch": 0.28, "learning_rate": 1.6808424562196982e-05, "loss": 1.3774, "step": 10391 }, { "epoch": 0.28, "learning_rate": 1.680777669605402e-05, "loss": 1.3752, "step": 10392 }, { "epoch": 0.28, "learning_rate": 1.680712877665021e-05, "loss": 1.3572, "step": 10393 }, { "epoch": 0.28, "learning_rate": 1.6806480803990624e-05, "loss": 1.144, "step": 10394 }, { "epoch": 0.28, "learning_rate": 1.6805832778080334e-05, "loss": 1.3459, "step": 10395 }, { "epoch": 0.28, "learning_rate": 1.6805184698924408e-05, "loss": 1.304, "step": 10396 }, { "epoch": 0.28, "learning_rate": 1.6804536566527917e-05, "loss": 1.2476, "step": 10397 }, { "epoch": 0.28, "learning_rate": 1.6803888380895935e-05, "loss": 1.1941, "step": 10398 }, { "epoch": 0.28, "learning_rate": 1.6803240142033525e-05, "loss": 1.2561, "step": 10399 }, { "epoch": 0.28, "learning_rate": 1.6802591849945768e-05, "loss": 1.4011, "step": 10400 }, { "epoch": 0.28, "learning_rate": 1.6801943504637727e-05, "loss": 1.3279, "step": 10401 }, { "epoch": 0.28, "learning_rate": 1.680129510611448e-05, "loss": 1.282, "step": 10402 }, { "epoch": 0.28, "learning_rate": 1.68006466543811e-05, "loss": 1.3467, "step": 10403 }, { "epoch": 0.28, "learning_rate": 1.6799998149442656e-05, "loss": 1.3667, "step": 10404 }, { "epoch": 0.28, "learning_rate": 1.6799349591304225e-05, "loss": 1.3879, "step": 10405 }, { "epoch": 0.28, "learning_rate": 1.679870097997088e-05, "loss": 1.5, "step": 10406 }, { "epoch": 0.28, "learning_rate": 1.6798052315447697e-05, "loss": 1.2224, "step": 10407 }, { "epoch": 0.28, "learning_rate": 1.6797403597739747e-05, "loss": 1.4131, "step": 10408 }, { "epoch": 0.28, "learning_rate": 1.679675482685211e-05, "loss": 1.4321, "step": 10409 }, { "epoch": 0.28, "learning_rate": 1.6796106002789855e-05, "loss": 1.3044, "step": 10410 }, { "epoch": 0.28, "learning_rate": 1.6795457125558067e-05, "loss": 1.4543, "step": 10411 }, { "epoch": 0.28, "learning_rate": 1.6794808195161815e-05, "loss": 1.4922, "step": 10412 }, { "epoch": 0.28, "learning_rate": 1.679415921160618e-05, "loss": 1.2341, "step": 10413 }, { "epoch": 0.28, "learning_rate": 1.6793510174896235e-05, "loss": 1.5776, "step": 10414 }, { "epoch": 0.28, "learning_rate": 1.679286108503707e-05, "loss": 1.3518, "step": 10415 }, { "epoch": 0.28, "learning_rate": 1.6792211942033745e-05, "loss": 1.3242, "step": 10416 }, { "epoch": 0.28, "learning_rate": 1.679156274589135e-05, "loss": 1.5405, "step": 10417 }, { "epoch": 0.28, "learning_rate": 1.6790913496614964e-05, "loss": 1.2368, "step": 10418 }, { "epoch": 0.28, "learning_rate": 1.6790264194209665e-05, "loss": 1.397, "step": 10419 }, { "epoch": 0.28, "learning_rate": 1.678961483868053e-05, "loss": 1.4414, "step": 10420 }, { "epoch": 0.28, "learning_rate": 1.6788965430032636e-05, "loss": 1.1924, "step": 10421 }, { "epoch": 0.28, "learning_rate": 1.6788315968271078e-05, "loss": 1.3071, "step": 10422 }, { "epoch": 0.28, "learning_rate": 1.6787666453400923e-05, "loss": 1.4719, "step": 10423 }, { "epoch": 0.28, "learning_rate": 1.6787016885427258e-05, "loss": 1.2009, "step": 10424 }, { "epoch": 0.28, "learning_rate": 1.6786367264355163e-05, "loss": 1.3735, "step": 10425 }, { "epoch": 0.28, "learning_rate": 1.6785717590189726e-05, "loss": 1.3833, "step": 10426 }, { "epoch": 0.28, "learning_rate": 1.678506786293602e-05, "loss": 1.4106, "step": 10427 }, { "epoch": 0.28, "learning_rate": 1.6784418082599137e-05, "loss": 1.3264, "step": 10428 }, { "epoch": 0.28, "learning_rate": 1.6783768249184156e-05, "loss": 1.3457, "step": 10429 }, { "epoch": 0.28, "learning_rate": 1.6783118362696162e-05, "loss": 1.3092, "step": 10430 }, { "epoch": 0.28, "learning_rate": 1.6782468423140242e-05, "loss": 1.5066, "step": 10431 }, { "epoch": 0.28, "learning_rate": 1.6781818430521475e-05, "loss": 1.3198, "step": 10432 }, { "epoch": 0.28, "learning_rate": 1.678116838484495e-05, "loss": 1.3225, "step": 10433 }, { "epoch": 0.28, "learning_rate": 1.6780518286115755e-05, "loss": 1.1316, "step": 10434 }, { "epoch": 0.28, "learning_rate": 1.677986813433897e-05, "loss": 1.3889, "step": 10435 }, { "epoch": 0.29, "learning_rate": 1.6779217929519686e-05, "loss": 1.2695, "step": 10436 }, { "epoch": 0.29, "learning_rate": 1.6778567671662994e-05, "loss": 1.2795, "step": 10437 }, { "epoch": 0.29, "learning_rate": 1.677791736077397e-05, "loss": 1.3181, "step": 10438 }, { "epoch": 0.29, "learning_rate": 1.6777266996857707e-05, "loss": 1.604, "step": 10439 }, { "epoch": 0.29, "learning_rate": 1.6776616579919296e-05, "loss": 1.3418, "step": 10440 }, { "epoch": 0.29, "learning_rate": 1.6775966109963823e-05, "loss": 1.2268, "step": 10441 }, { "epoch": 0.29, "learning_rate": 1.677531558699638e-05, "loss": 1.2346, "step": 10442 }, { "epoch": 0.29, "learning_rate": 1.677466501102205e-05, "loss": 1.3943, "step": 10443 }, { "epoch": 0.29, "learning_rate": 1.6774014382045928e-05, "loss": 1.2361, "step": 10444 }, { "epoch": 0.29, "learning_rate": 1.6773363700073107e-05, "loss": 1.4297, "step": 10445 }, { "epoch": 0.29, "learning_rate": 1.6772712965108668e-05, "loss": 1.3459, "step": 10446 }, { "epoch": 0.29, "learning_rate": 1.6772062177157708e-05, "loss": 1.344, "step": 10447 }, { "epoch": 0.29, "learning_rate": 1.677141133622532e-05, "loss": 1.3699, "step": 10448 }, { "epoch": 0.29, "learning_rate": 1.6770760442316593e-05, "loss": 1.3496, "step": 10449 }, { "epoch": 0.29, "learning_rate": 1.677010949543662e-05, "loss": 1.2974, "step": 10450 }, { "epoch": 0.29, "learning_rate": 1.6769458495590495e-05, "loss": 1.4131, "step": 10451 }, { "epoch": 0.29, "learning_rate": 1.676880744278331e-05, "loss": 1.4097, "step": 10452 }, { "epoch": 0.29, "learning_rate": 1.6768156337020155e-05, "loss": 1.2346, "step": 10453 }, { "epoch": 0.29, "learning_rate": 1.6767505178306133e-05, "loss": 1.3152, "step": 10454 }, { "epoch": 0.29, "learning_rate": 1.6766853966646327e-05, "loss": 1.2737, "step": 10455 }, { "epoch": 0.29, "learning_rate": 1.676620270204584e-05, "loss": 1.4292, "step": 10456 }, { "epoch": 0.29, "learning_rate": 1.6765551384509766e-05, "loss": 1.4448, "step": 10457 }, { "epoch": 0.29, "learning_rate": 1.67649000140432e-05, "loss": 1.2524, "step": 10458 }, { "epoch": 0.29, "learning_rate": 1.6764248590651235e-05, "loss": 1.1396, "step": 10459 }, { "epoch": 0.29, "learning_rate": 1.676359711433897e-05, "loss": 1.3184, "step": 10460 }, { "epoch": 0.29, "learning_rate": 1.6762945585111503e-05, "loss": 1.4907, "step": 10461 }, { "epoch": 0.29, "learning_rate": 1.676229400297393e-05, "loss": 1.3679, "step": 10462 }, { "epoch": 0.29, "learning_rate": 1.6761642367931346e-05, "loss": 1.3633, "step": 10463 }, { "epoch": 0.29, "learning_rate": 1.6760990679988855e-05, "loss": 1.4272, "step": 10464 }, { "epoch": 0.29, "learning_rate": 1.6760338939151548e-05, "loss": 1.4221, "step": 10465 }, { "epoch": 0.29, "learning_rate": 1.675968714542453e-05, "loss": 1.4548, "step": 10466 }, { "epoch": 0.29, "learning_rate": 1.67590352988129e-05, "loss": 1.3306, "step": 10467 }, { "epoch": 0.29, "learning_rate": 1.6758383399321756e-05, "loss": 1.4343, "step": 10468 }, { "epoch": 0.29, "learning_rate": 1.6757731446956198e-05, "loss": 1.2217, "step": 10469 }, { "epoch": 0.29, "learning_rate": 1.6757079441721328e-05, "loss": 1.4424, "step": 10470 }, { "epoch": 0.29, "learning_rate": 1.6756427383622243e-05, "loss": 1.3564, "step": 10471 }, { "epoch": 0.29, "learning_rate": 1.675577527266405e-05, "loss": 1.1667, "step": 10472 }, { "epoch": 0.29, "learning_rate": 1.6755123108851846e-05, "loss": 1.2043, "step": 10473 }, { "epoch": 0.29, "learning_rate": 1.6754470892190735e-05, "loss": 1.4316, "step": 10474 }, { "epoch": 0.29, "learning_rate": 1.6753818622685817e-05, "loss": 1.1443, "step": 10475 }, { "epoch": 0.29, "learning_rate": 1.6753166300342204e-05, "loss": 1.373, "step": 10476 }, { "epoch": 0.29, "learning_rate": 1.675251392516499e-05, "loss": 1.5117, "step": 10477 }, { "epoch": 0.29, "learning_rate": 1.6751861497159285e-05, "loss": 1.3059, "step": 10478 }, { "epoch": 0.29, "learning_rate": 1.6751209016330186e-05, "loss": 1.157, "step": 10479 }, { "epoch": 0.29, "learning_rate": 1.6750556482682807e-05, "loss": 1.373, "step": 10480 }, { "epoch": 0.29, "learning_rate": 1.6749903896222246e-05, "loss": 1.1843, "step": 10481 }, { "epoch": 0.29, "learning_rate": 1.6749251256953613e-05, "loss": 1.1626, "step": 10482 }, { "epoch": 0.29, "learning_rate": 1.674859856488201e-05, "loss": 1.3152, "step": 10483 }, { "epoch": 0.29, "learning_rate": 1.6747945820012548e-05, "loss": 1.3916, "step": 10484 }, { "epoch": 0.29, "learning_rate": 1.674729302235033e-05, "loss": 1.3899, "step": 10485 }, { "epoch": 0.29, "learning_rate": 1.674664017190046e-05, "loss": 1.3447, "step": 10486 }, { "epoch": 0.29, "learning_rate": 1.6745987268668053e-05, "loss": 1.2412, "step": 10487 }, { "epoch": 0.29, "learning_rate": 1.674533431265821e-05, "loss": 1.2302, "step": 10488 }, { "epoch": 0.29, "learning_rate": 1.674468130387605e-05, "loss": 1.4019, "step": 10489 }, { "epoch": 0.29, "learning_rate": 1.6744028242326674e-05, "loss": 1.2961, "step": 10490 }, { "epoch": 0.29, "learning_rate": 1.6743375128015187e-05, "loss": 1.282, "step": 10491 }, { "epoch": 0.29, "learning_rate": 1.6742721960946707e-05, "loss": 1.343, "step": 10492 }, { "epoch": 0.29, "learning_rate": 1.6742068741126344e-05, "loss": 1.3975, "step": 10493 }, { "epoch": 0.29, "learning_rate": 1.67414154685592e-05, "loss": 1.3257, "step": 10494 }, { "epoch": 0.29, "learning_rate": 1.6740762143250395e-05, "loss": 1.4009, "step": 10495 }, { "epoch": 0.29, "learning_rate": 1.6740108765205036e-05, "loss": 1.4365, "step": 10496 }, { "epoch": 0.29, "learning_rate": 1.6739455334428233e-05, "loss": 1.3481, "step": 10497 }, { "epoch": 0.29, "learning_rate": 1.6738801850925103e-05, "loss": 1.3159, "step": 10498 }, { "epoch": 0.29, "learning_rate": 1.6738148314700756e-05, "loss": 1.3396, "step": 10499 }, { "epoch": 0.29, "learning_rate": 1.6737494725760307e-05, "loss": 1.342, "step": 10500 }, { "epoch": 0.29, "learning_rate": 1.6736841084108865e-05, "loss": 1.4514, "step": 10501 }, { "epoch": 0.29, "learning_rate": 1.6736187389751547e-05, "loss": 1.2666, "step": 10502 }, { "epoch": 0.29, "learning_rate": 1.6735533642693465e-05, "loss": 1.4485, "step": 10503 }, { "epoch": 0.29, "learning_rate": 1.673487984293974e-05, "loss": 1.3547, "step": 10504 }, { "epoch": 0.29, "learning_rate": 1.6734225990495475e-05, "loss": 1.3687, "step": 10505 }, { "epoch": 0.29, "learning_rate": 1.6733572085365795e-05, "loss": 1.4043, "step": 10506 }, { "epoch": 0.29, "learning_rate": 1.6732918127555816e-05, "loss": 1.488, "step": 10507 }, { "epoch": 0.29, "learning_rate": 1.6732264117070647e-05, "loss": 1.2427, "step": 10508 }, { "epoch": 0.29, "learning_rate": 1.6731610053915414e-05, "loss": 1.6875, "step": 10509 }, { "epoch": 0.29, "learning_rate": 1.6730955938095226e-05, "loss": 1.3499, "step": 10510 }, { "epoch": 0.29, "learning_rate": 1.6730301769615204e-05, "loss": 1.283, "step": 10511 }, { "epoch": 0.29, "learning_rate": 1.672964754848047e-05, "loss": 1.3193, "step": 10512 }, { "epoch": 0.29, "learning_rate": 1.6728993274696135e-05, "loss": 1.4092, "step": 10513 }, { "epoch": 0.29, "learning_rate": 1.672833894826732e-05, "loss": 1.2229, "step": 10514 }, { "epoch": 0.29, "learning_rate": 1.6727684569199146e-05, "loss": 1.3735, "step": 10515 }, { "epoch": 0.29, "learning_rate": 1.672703013749673e-05, "loss": 1.2532, "step": 10516 }, { "epoch": 0.29, "learning_rate": 1.6726375653165193e-05, "loss": 1.4443, "step": 10517 }, { "epoch": 0.29, "learning_rate": 1.672572111620966e-05, "loss": 1.1895, "step": 10518 }, { "epoch": 0.29, "learning_rate": 1.6725066526635244e-05, "loss": 1.5063, "step": 10519 }, { "epoch": 0.29, "learning_rate": 1.6724411884447072e-05, "loss": 1.2124, "step": 10520 }, { "epoch": 0.29, "learning_rate": 1.6723757189650263e-05, "loss": 1.4741, "step": 10521 }, { "epoch": 0.29, "learning_rate": 1.6723102442249937e-05, "loss": 1.1609, "step": 10522 }, { "epoch": 0.29, "learning_rate": 1.672244764225122e-05, "loss": 1.3936, "step": 10523 }, { "epoch": 0.29, "learning_rate": 1.6721792789659236e-05, "loss": 1.3677, "step": 10524 }, { "epoch": 0.29, "learning_rate": 1.6721137884479108e-05, "loss": 1.2598, "step": 10525 }, { "epoch": 0.29, "learning_rate": 1.6720482926715953e-05, "loss": 1.3628, "step": 10526 }, { "epoch": 0.29, "learning_rate": 1.6719827916374902e-05, "loss": 1.3091, "step": 10527 }, { "epoch": 0.29, "learning_rate": 1.6719172853461074e-05, "loss": 1.2231, "step": 10528 }, { "epoch": 0.29, "learning_rate": 1.6718517737979602e-05, "loss": 1.2738, "step": 10529 }, { "epoch": 0.29, "learning_rate": 1.6717862569935603e-05, "loss": 1.4392, "step": 10530 }, { "epoch": 0.29, "learning_rate": 1.6717207349334208e-05, "loss": 1.7314, "step": 10531 }, { "epoch": 0.29, "learning_rate": 1.671655207618054e-05, "loss": 1.3381, "step": 10532 }, { "epoch": 0.29, "learning_rate": 1.671589675047973e-05, "loss": 1.4731, "step": 10533 }, { "epoch": 0.29, "learning_rate": 1.6715241372236897e-05, "loss": 1.3677, "step": 10534 }, { "epoch": 0.29, "learning_rate": 1.6714585941457175e-05, "loss": 1.197, "step": 10535 }, { "epoch": 0.29, "learning_rate": 1.6713930458145693e-05, "loss": 1.4043, "step": 10536 }, { "epoch": 0.29, "learning_rate": 1.6713274922307573e-05, "loss": 1.4187, "step": 10537 }, { "epoch": 0.29, "learning_rate": 1.671261933394795e-05, "loss": 1.2559, "step": 10538 }, { "epoch": 0.29, "learning_rate": 1.6711963693071943e-05, "loss": 1.2859, "step": 10539 }, { "epoch": 0.29, "learning_rate": 1.6711307999684696e-05, "loss": 1.7349, "step": 10540 }, { "epoch": 0.29, "learning_rate": 1.6710652253791326e-05, "loss": 1.425, "step": 10541 }, { "epoch": 0.29, "learning_rate": 1.670999645539697e-05, "loss": 1.4197, "step": 10542 }, { "epoch": 0.29, "learning_rate": 1.670934060450676e-05, "loss": 1.4692, "step": 10543 }, { "epoch": 0.29, "learning_rate": 1.6708684701125818e-05, "loss": 1.3574, "step": 10544 }, { "epoch": 0.29, "learning_rate": 1.670802874525929e-05, "loss": 1.3328, "step": 10545 }, { "epoch": 0.29, "learning_rate": 1.670737273691229e-05, "loss": 1.2253, "step": 10546 }, { "epoch": 0.29, "learning_rate": 1.6706716676089963e-05, "loss": 1.4753, "step": 10547 }, { "epoch": 0.29, "learning_rate": 1.670606056279744e-05, "loss": 1.354, "step": 10548 }, { "epoch": 0.29, "learning_rate": 1.6705404397039852e-05, "loss": 1.3975, "step": 10549 }, { "epoch": 0.29, "learning_rate": 1.6704748178822337e-05, "loss": 1.3152, "step": 10550 }, { "epoch": 0.29, "learning_rate": 1.670409190815002e-05, "loss": 1.2415, "step": 10551 }, { "epoch": 0.29, "learning_rate": 1.670343558502804e-05, "loss": 1.5305, "step": 10552 }, { "epoch": 0.29, "learning_rate": 1.6702779209461532e-05, "loss": 1.3433, "step": 10553 }, { "epoch": 0.29, "learning_rate": 1.6702122781455634e-05, "loss": 1.2944, "step": 10554 }, { "epoch": 0.29, "learning_rate": 1.670146630101548e-05, "loss": 1.3093, "step": 10555 }, { "epoch": 0.29, "learning_rate": 1.6700809768146203e-05, "loss": 1.3975, "step": 10556 }, { "epoch": 0.29, "learning_rate": 1.670015318285294e-05, "loss": 1.3618, "step": 10557 }, { "epoch": 0.29, "learning_rate": 1.669949654514083e-05, "loss": 1.2327, "step": 10558 }, { "epoch": 0.29, "learning_rate": 1.669883985501501e-05, "loss": 1.3782, "step": 10559 }, { "epoch": 0.29, "learning_rate": 1.6698183112480618e-05, "loss": 1.3721, "step": 10560 }, { "epoch": 0.29, "learning_rate": 1.669752631754279e-05, "loss": 1.3352, "step": 10561 }, { "epoch": 0.29, "learning_rate": 1.6696869470206666e-05, "loss": 1.4089, "step": 10562 }, { "epoch": 0.29, "learning_rate": 1.6696212570477382e-05, "loss": 1.4241, "step": 10563 }, { "epoch": 0.29, "learning_rate": 1.6695555618360083e-05, "loss": 1.4438, "step": 10564 }, { "epoch": 0.29, "learning_rate": 1.66948986138599e-05, "loss": 1.3052, "step": 10565 }, { "epoch": 0.29, "learning_rate": 1.6694241556981984e-05, "loss": 1.459, "step": 10566 }, { "epoch": 0.29, "learning_rate": 1.6693584447731467e-05, "loss": 1.3794, "step": 10567 }, { "epoch": 0.29, "learning_rate": 1.6692927286113494e-05, "loss": 1.321, "step": 10568 }, { "epoch": 0.29, "learning_rate": 1.6692270072133205e-05, "loss": 1.2083, "step": 10569 }, { "epoch": 0.29, "learning_rate": 1.6691612805795742e-05, "loss": 1.4033, "step": 10570 }, { "epoch": 0.29, "learning_rate": 1.6690955487106246e-05, "loss": 1.3252, "step": 10571 }, { "epoch": 0.29, "learning_rate": 1.6690298116069863e-05, "loss": 1.4526, "step": 10572 }, { "epoch": 0.29, "learning_rate": 1.668964069269173e-05, "loss": 1.301, "step": 10573 }, { "epoch": 0.29, "learning_rate": 1.6688983216976996e-05, "loss": 1.2981, "step": 10574 }, { "epoch": 0.29, "learning_rate": 1.6688325688930804e-05, "loss": 1.3428, "step": 10575 }, { "epoch": 0.29, "learning_rate": 1.6687668108558296e-05, "loss": 1.3442, "step": 10576 }, { "epoch": 0.29, "learning_rate": 1.6687010475864616e-05, "loss": 1.4001, "step": 10577 }, { "epoch": 0.29, "learning_rate": 1.668635279085491e-05, "loss": 1.252, "step": 10578 }, { "epoch": 0.29, "learning_rate": 1.6685695053534327e-05, "loss": 1.2581, "step": 10579 }, { "epoch": 0.29, "learning_rate": 1.6685037263908007e-05, "loss": 1.3499, "step": 10580 }, { "epoch": 0.29, "learning_rate": 1.66843794219811e-05, "loss": 1.3005, "step": 10581 }, { "epoch": 0.29, "learning_rate": 1.668372152775875e-05, "loss": 1.3147, "step": 10582 }, { "epoch": 0.29, "learning_rate": 1.668306358124611e-05, "loss": 1.292, "step": 10583 }, { "epoch": 0.29, "learning_rate": 1.6682405582448317e-05, "loss": 1.3501, "step": 10584 }, { "epoch": 0.29, "learning_rate": 1.668174753137053e-05, "loss": 1.2815, "step": 10585 }, { "epoch": 0.29, "learning_rate": 1.668108942801789e-05, "loss": 1.3901, "step": 10586 }, { "epoch": 0.29, "learning_rate": 1.668043127239555e-05, "loss": 1.4932, "step": 10587 }, { "epoch": 0.29, "learning_rate": 1.6679773064508652e-05, "loss": 1.7422, "step": 10588 }, { "epoch": 0.29, "learning_rate": 1.6679114804362354e-05, "loss": 1.3745, "step": 10589 }, { "epoch": 0.29, "learning_rate": 1.6678456491961804e-05, "loss": 1.3264, "step": 10590 }, { "epoch": 0.29, "learning_rate": 1.667779812731215e-05, "loss": 1.7104, "step": 10591 }, { "epoch": 0.29, "learning_rate": 1.6677139710418547e-05, "loss": 1.3638, "step": 10592 }, { "epoch": 0.29, "learning_rate": 1.6676481241286134e-05, "loss": 1.302, "step": 10593 }, { "epoch": 0.29, "learning_rate": 1.667582271992008e-05, "loss": 1.3396, "step": 10594 }, { "epoch": 0.29, "learning_rate": 1.6675164146325525e-05, "loss": 1.1624, "step": 10595 }, { "epoch": 0.29, "learning_rate": 1.6674505520507622e-05, "loss": 1.3218, "step": 10596 }, { "epoch": 0.29, "learning_rate": 1.667384684247153e-05, "loss": 1.4309, "step": 10597 }, { "epoch": 0.29, "learning_rate": 1.6673188112222394e-05, "loss": 1.4185, "step": 10598 }, { "epoch": 0.29, "learning_rate": 1.6672529329765376e-05, "loss": 1.4404, "step": 10599 }, { "epoch": 0.29, "learning_rate": 1.6671870495105625e-05, "loss": 1.7642, "step": 10600 }, { "epoch": 0.29, "learning_rate": 1.66712116082483e-05, "loss": 1.4277, "step": 10601 }, { "epoch": 0.29, "learning_rate": 1.6670552669198547e-05, "loss": 1.3196, "step": 10602 }, { "epoch": 0.29, "learning_rate": 1.6669893677961527e-05, "loss": 1.4807, "step": 10603 }, { "epoch": 0.29, "learning_rate": 1.66692346345424e-05, "loss": 1.3794, "step": 10604 }, { "epoch": 0.29, "learning_rate": 1.6668575538946315e-05, "loss": 1.4221, "step": 10605 }, { "epoch": 0.29, "learning_rate": 1.666791639117843e-05, "loss": 1.3228, "step": 10606 }, { "epoch": 0.29, "learning_rate": 1.6667257191243903e-05, "loss": 1.2666, "step": 10607 }, { "epoch": 0.29, "learning_rate": 1.666659793914789e-05, "loss": 1.4272, "step": 10608 }, { "epoch": 0.29, "learning_rate": 1.666593863489555e-05, "loss": 1.2354, "step": 10609 }, { "epoch": 0.29, "learning_rate": 1.6665279278492043e-05, "loss": 1.2844, "step": 10610 }, { "epoch": 0.29, "learning_rate": 1.6664619869942524e-05, "loss": 1.3359, "step": 10611 }, { "epoch": 0.29, "learning_rate": 1.666396040925215e-05, "loss": 1.2439, "step": 10612 }, { "epoch": 0.29, "learning_rate": 1.6663300896426088e-05, "loss": 1.4373, "step": 10613 }, { "epoch": 0.29, "learning_rate": 1.666264133146949e-05, "loss": 1.2957, "step": 10614 }, { "epoch": 0.29, "learning_rate": 1.666198171438752e-05, "loss": 1.3972, "step": 10615 }, { "epoch": 0.29, "learning_rate": 1.6661322045185334e-05, "loss": 1.3286, "step": 10616 }, { "epoch": 0.29, "learning_rate": 1.6660662323868103e-05, "loss": 1.3398, "step": 10617 }, { "epoch": 0.29, "learning_rate": 1.6660002550440978e-05, "loss": 1.3984, "step": 10618 }, { "epoch": 0.29, "learning_rate": 1.6659342724909126e-05, "loss": 1.4526, "step": 10619 }, { "epoch": 0.29, "learning_rate": 1.665868284727771e-05, "loss": 1.355, "step": 10620 }, { "epoch": 0.29, "learning_rate": 1.6658022917551888e-05, "loss": 1.3186, "step": 10621 }, { "epoch": 0.29, "learning_rate": 1.6657362935736826e-05, "loss": 1.3696, "step": 10622 }, { "epoch": 0.29, "learning_rate": 1.6656702901837688e-05, "loss": 1.3811, "step": 10623 }, { "epoch": 0.29, "learning_rate": 1.6656042815859637e-05, "loss": 1.4233, "step": 10624 }, { "epoch": 0.29, "learning_rate": 1.6655382677807837e-05, "loss": 1.1782, "step": 10625 }, { "epoch": 0.29, "learning_rate": 1.6654722487687448e-05, "loss": 1.3796, "step": 10626 }, { "epoch": 0.29, "learning_rate": 1.6654062245503646e-05, "loss": 1.4629, "step": 10627 }, { "epoch": 0.29, "learning_rate": 1.6653401951261586e-05, "loss": 1.4583, "step": 10628 }, { "epoch": 0.29, "learning_rate": 1.6652741604966438e-05, "loss": 1.3398, "step": 10629 }, { "epoch": 0.29, "learning_rate": 1.6652081206623368e-05, "loss": 1.4585, "step": 10630 }, { "epoch": 0.29, "learning_rate": 1.6651420756237543e-05, "loss": 1.3301, "step": 10631 }, { "epoch": 0.29, "learning_rate": 1.6650760253814128e-05, "loss": 1.3679, "step": 10632 }, { "epoch": 0.29, "learning_rate": 1.6650099699358295e-05, "loss": 1.1763, "step": 10633 }, { "epoch": 0.29, "learning_rate": 1.664943909287521e-05, "loss": 1.3079, "step": 10634 }, { "epoch": 0.29, "learning_rate": 1.6648778434370037e-05, "loss": 1.7422, "step": 10635 }, { "epoch": 0.29, "learning_rate": 1.664811772384795e-05, "loss": 1.3599, "step": 10636 }, { "epoch": 0.29, "learning_rate": 1.6647456961314117e-05, "loss": 1.3362, "step": 10637 }, { "epoch": 0.29, "learning_rate": 1.6646796146773703e-05, "loss": 1.4561, "step": 10638 }, { "epoch": 0.29, "learning_rate": 1.6646135280231884e-05, "loss": 1.2986, "step": 10639 }, { "epoch": 0.29, "learning_rate": 1.6645474361693826e-05, "loss": 1.3364, "step": 10640 }, { "epoch": 0.29, "learning_rate": 1.6644813391164703e-05, "loss": 1.4214, "step": 10641 }, { "epoch": 0.29, "learning_rate": 1.6644152368649685e-05, "loss": 1.4688, "step": 10642 }, { "epoch": 0.29, "learning_rate": 1.6643491294153946e-05, "loss": 1.3306, "step": 10643 }, { "epoch": 0.29, "learning_rate": 1.6642830167682652e-05, "loss": 1.3604, "step": 10644 }, { "epoch": 0.29, "learning_rate": 1.6642168989240977e-05, "loss": 1.3911, "step": 10645 }, { "epoch": 0.29, "learning_rate": 1.6641507758834096e-05, "loss": 1.3743, "step": 10646 }, { "epoch": 0.29, "learning_rate": 1.664084647646718e-05, "loss": 1.3298, "step": 10647 }, { "epoch": 0.29, "learning_rate": 1.664018514214541e-05, "loss": 1.363, "step": 10648 }, { "epoch": 0.29, "learning_rate": 1.663952375587395e-05, "loss": 1.3833, "step": 10649 }, { "epoch": 0.29, "learning_rate": 1.6638862317657976e-05, "loss": 1.4001, "step": 10650 }, { "epoch": 0.29, "learning_rate": 1.6638200827502667e-05, "loss": 1.4089, "step": 10651 }, { "epoch": 0.29, "learning_rate": 1.6637539285413194e-05, "loss": 1.3157, "step": 10652 }, { "epoch": 0.29, "learning_rate": 1.663687769139474e-05, "loss": 1.4238, "step": 10653 }, { "epoch": 0.29, "learning_rate": 1.6636216045452475e-05, "loss": 1.2314, "step": 10654 }, { "epoch": 0.29, "learning_rate": 1.6635554347591572e-05, "loss": 1.2083, "step": 10655 }, { "epoch": 0.29, "learning_rate": 1.6634892597817213e-05, "loss": 1.4836, "step": 10656 }, { "epoch": 0.29, "learning_rate": 1.6634230796134578e-05, "loss": 1.3857, "step": 10657 }, { "epoch": 0.29, "learning_rate": 1.6633568942548833e-05, "loss": 1.3079, "step": 10658 }, { "epoch": 0.29, "learning_rate": 1.6632907037065173e-05, "loss": 1.3232, "step": 10659 }, { "epoch": 0.29, "learning_rate": 1.6632245079688764e-05, "loss": 1.4141, "step": 10660 }, { "epoch": 0.29, "learning_rate": 1.6631583070424784e-05, "loss": 1.3142, "step": 10661 }, { "epoch": 0.29, "learning_rate": 1.6630921009278424e-05, "loss": 1.2571, "step": 10662 }, { "epoch": 0.29, "learning_rate": 1.6630258896254853e-05, "loss": 1.4312, "step": 10663 }, { "epoch": 0.29, "learning_rate": 1.662959673135925e-05, "loss": 1.3359, "step": 10664 }, { "epoch": 0.29, "learning_rate": 1.6628934514596804e-05, "loss": 1.3916, "step": 10665 }, { "epoch": 0.29, "learning_rate": 1.662827224597269e-05, "loss": 1.3875, "step": 10666 }, { "epoch": 0.29, "learning_rate": 1.6627609925492092e-05, "loss": 1.2173, "step": 10667 }, { "epoch": 0.29, "learning_rate": 1.6626947553160193e-05, "loss": 1.3152, "step": 10668 }, { "epoch": 0.29, "learning_rate": 1.662628512898217e-05, "loss": 1.3411, "step": 10669 }, { "epoch": 0.29, "learning_rate": 1.6625622652963204e-05, "loss": 1.4822, "step": 10670 }, { "epoch": 0.29, "learning_rate": 1.6624960125108486e-05, "loss": 1.2708, "step": 10671 }, { "epoch": 0.29, "learning_rate": 1.6624297545423195e-05, "loss": 1.3633, "step": 10672 }, { "epoch": 0.29, "learning_rate": 1.6623634913912515e-05, "loss": 1.4097, "step": 10673 }, { "epoch": 0.29, "learning_rate": 1.662297223058163e-05, "loss": 1.3591, "step": 10674 }, { "epoch": 0.29, "learning_rate": 1.6622309495435723e-05, "loss": 1.3601, "step": 10675 }, { "epoch": 0.29, "learning_rate": 1.6621646708479983e-05, "loss": 1.3604, "step": 10676 }, { "epoch": 0.29, "learning_rate": 1.662098386971959e-05, "loss": 1.3042, "step": 10677 }, { "epoch": 0.29, "learning_rate": 1.6620320979159735e-05, "loss": 1.4062, "step": 10678 }, { "epoch": 0.29, "learning_rate": 1.66196580368056e-05, "loss": 1.3584, "step": 10679 }, { "epoch": 0.29, "learning_rate": 1.6618995042662374e-05, "loss": 1.3406, "step": 10680 }, { "epoch": 0.29, "learning_rate": 1.6618331996735248e-05, "loss": 1.3477, "step": 10681 }, { "epoch": 0.29, "learning_rate": 1.6617668899029394e-05, "loss": 1.3069, "step": 10682 }, { "epoch": 0.29, "learning_rate": 1.661700574955002e-05, "loss": 1.6504, "step": 10683 }, { "epoch": 0.29, "learning_rate": 1.6616342548302303e-05, "loss": 1.374, "step": 10684 }, { "epoch": 0.29, "learning_rate": 1.661567929529143e-05, "loss": 1.2966, "step": 10685 }, { "epoch": 0.29, "learning_rate": 1.6615015990522592e-05, "loss": 1.4434, "step": 10686 }, { "epoch": 0.29, "learning_rate": 1.6614352634000983e-05, "loss": 1.4224, "step": 10687 }, { "epoch": 0.29, "learning_rate": 1.661368922573179e-05, "loss": 1.2874, "step": 10688 }, { "epoch": 0.29, "learning_rate": 1.66130257657202e-05, "loss": 1.355, "step": 10689 }, { "epoch": 0.29, "learning_rate": 1.6612362253971408e-05, "loss": 1.3164, "step": 10690 }, { "epoch": 0.29, "learning_rate": 1.66116986904906e-05, "loss": 1.2795, "step": 10691 }, { "epoch": 0.29, "learning_rate": 1.661103507528297e-05, "loss": 1.3171, "step": 10692 }, { "epoch": 0.29, "learning_rate": 1.6610371408353713e-05, "loss": 1.2501, "step": 10693 }, { "epoch": 0.29, "learning_rate": 1.660970768970802e-05, "loss": 1.2646, "step": 10694 }, { "epoch": 0.29, "learning_rate": 1.660904391935108e-05, "loss": 1.207, "step": 10695 }, { "epoch": 0.29, "learning_rate": 1.6608380097288087e-05, "loss": 1.3191, "step": 10696 }, { "epoch": 0.29, "learning_rate": 1.660771622352424e-05, "loss": 1.293, "step": 10697 }, { "epoch": 0.29, "learning_rate": 1.6607052298064722e-05, "loss": 1.1289, "step": 10698 }, { "epoch": 0.29, "learning_rate": 1.660638832091474e-05, "loss": 1.2042, "step": 10699 }, { "epoch": 0.29, "learning_rate": 1.6605724292079476e-05, "loss": 1.189, "step": 10700 }, { "epoch": 0.29, "learning_rate": 1.660506021156414e-05, "loss": 1.2554, "step": 10701 }, { "epoch": 0.29, "learning_rate": 1.660439607937391e-05, "loss": 1.4307, "step": 10702 }, { "epoch": 0.29, "learning_rate": 1.6603731895513996e-05, "loss": 1.2703, "step": 10703 }, { "epoch": 0.29, "learning_rate": 1.6603067659989587e-05, "loss": 1.3582, "step": 10704 }, { "epoch": 0.29, "learning_rate": 1.6602403372805882e-05, "loss": 1.2932, "step": 10705 }, { "epoch": 0.29, "learning_rate": 1.6601739033968075e-05, "loss": 1.4009, "step": 10706 }, { "epoch": 0.29, "learning_rate": 1.660107464348137e-05, "loss": 1.4426, "step": 10707 }, { "epoch": 0.29, "learning_rate": 1.6600410201350962e-05, "loss": 1.2429, "step": 10708 }, { "epoch": 0.29, "learning_rate": 1.6599745707582043e-05, "loss": 1.4658, "step": 10709 }, { "epoch": 0.29, "learning_rate": 1.6599081162179823e-05, "loss": 1.3254, "step": 10710 }, { "epoch": 0.29, "learning_rate": 1.659841656514949e-05, "loss": 1.1904, "step": 10711 }, { "epoch": 0.29, "learning_rate": 1.659775191649625e-05, "loss": 1.4202, "step": 10712 }, { "epoch": 0.29, "learning_rate": 1.6597087216225304e-05, "loss": 1.3184, "step": 10713 }, { "epoch": 0.29, "learning_rate": 1.6596422464341845e-05, "loss": 1.4468, "step": 10714 }, { "epoch": 0.29, "learning_rate": 1.6595757660851084e-05, "loss": 1.1519, "step": 10715 }, { "epoch": 0.29, "learning_rate": 1.6595092805758212e-05, "loss": 1.5605, "step": 10716 }, { "epoch": 0.29, "learning_rate": 1.659442789906844e-05, "loss": 1.5857, "step": 10717 }, { "epoch": 0.29, "learning_rate": 1.659376294078696e-05, "loss": 1.4287, "step": 10718 }, { "epoch": 0.29, "learning_rate": 1.6593097930918984e-05, "loss": 1.366, "step": 10719 }, { "epoch": 0.29, "learning_rate": 1.6592432869469706e-05, "loss": 1.4575, "step": 10720 }, { "epoch": 0.29, "learning_rate": 1.6591767756444338e-05, "loss": 1.3419, "step": 10721 }, { "epoch": 0.29, "learning_rate": 1.6591102591848073e-05, "loss": 1.2268, "step": 10722 }, { "epoch": 0.29, "learning_rate": 1.6590437375686123e-05, "loss": 1.4182, "step": 10723 }, { "epoch": 0.29, "learning_rate": 1.6589772107963692e-05, "loss": 1.3298, "step": 10724 }, { "epoch": 0.29, "learning_rate": 1.658910678868598e-05, "loss": 1.5659, "step": 10725 }, { "epoch": 0.29, "learning_rate": 1.6588441417858196e-05, "loss": 1.2117, "step": 10726 }, { "epoch": 0.29, "learning_rate": 1.6587775995485543e-05, "loss": 1.3186, "step": 10727 }, { "epoch": 0.29, "learning_rate": 1.6587110521573232e-05, "loss": 1.3076, "step": 10728 }, { "epoch": 0.29, "learning_rate": 1.658644499612646e-05, "loss": 1.3621, "step": 10729 }, { "epoch": 0.29, "learning_rate": 1.6585779419150445e-05, "loss": 1.3479, "step": 10730 }, { "epoch": 0.29, "learning_rate": 1.658511379065039e-05, "loss": 1.3425, "step": 10731 }, { "epoch": 0.29, "learning_rate": 1.6584448110631496e-05, "loss": 1.24, "step": 10732 }, { "epoch": 0.29, "learning_rate": 1.6583782379098977e-05, "loss": 1.2808, "step": 10733 }, { "epoch": 0.29, "learning_rate": 1.658311659605804e-05, "loss": 1.2883, "step": 10734 }, { "epoch": 0.29, "learning_rate": 1.65824507615139e-05, "loss": 1.3037, "step": 10735 }, { "epoch": 0.29, "learning_rate": 1.6581784875471757e-05, "loss": 1.3604, "step": 10736 }, { "epoch": 0.29, "learning_rate": 1.6581118937936823e-05, "loss": 1.385, "step": 10737 }, { "epoch": 0.29, "learning_rate": 1.658045294891431e-05, "loss": 1.1936, "step": 10738 }, { "epoch": 0.29, "learning_rate": 1.6579786908409427e-05, "loss": 1.3887, "step": 10739 }, { "epoch": 0.29, "learning_rate": 1.6579120816427387e-05, "loss": 1.2852, "step": 10740 }, { "epoch": 0.29, "learning_rate": 1.6578454672973397e-05, "loss": 1.3618, "step": 10741 }, { "epoch": 0.29, "learning_rate": 1.657778847805267e-05, "loss": 1.481, "step": 10742 }, { "epoch": 0.29, "learning_rate": 1.6577122231670424e-05, "loss": 1.3374, "step": 10743 }, { "epoch": 0.29, "learning_rate": 1.6576455933831862e-05, "loss": 1.3042, "step": 10744 }, { "epoch": 0.29, "learning_rate": 1.6575789584542202e-05, "loss": 1.1724, "step": 10745 }, { "epoch": 0.29, "learning_rate": 1.6575123183806657e-05, "loss": 1.2917, "step": 10746 }, { "epoch": 0.29, "learning_rate": 1.6574456731630443e-05, "loss": 1.4106, "step": 10747 }, { "epoch": 0.29, "learning_rate": 1.6573790228018765e-05, "loss": 1.3091, "step": 10748 }, { "epoch": 0.29, "learning_rate": 1.657312367297685e-05, "loss": 1.23, "step": 10749 }, { "epoch": 0.29, "learning_rate": 1.6572457066509905e-05, "loss": 1.2961, "step": 10750 }, { "epoch": 0.29, "learning_rate": 1.6571790408623143e-05, "loss": 1.3569, "step": 10751 }, { "epoch": 0.29, "learning_rate": 1.6571123699321786e-05, "loss": 1.4099, "step": 10752 }, { "epoch": 0.29, "learning_rate": 1.6570456938611042e-05, "loss": 1.4263, "step": 10753 }, { "epoch": 0.29, "learning_rate": 1.656979012649614e-05, "loss": 1.479, "step": 10754 }, { "epoch": 0.29, "learning_rate": 1.6569123262982283e-05, "loss": 1.3213, "step": 10755 }, { "epoch": 0.29, "learning_rate": 1.6568456348074697e-05, "loss": 1.4829, "step": 10756 }, { "epoch": 0.29, "learning_rate": 1.6567789381778597e-05, "loss": 1.3235, "step": 10757 }, { "epoch": 0.29, "learning_rate": 1.6567122364099202e-05, "loss": 1.4014, "step": 10758 }, { "epoch": 0.29, "learning_rate": 1.6566455295041733e-05, "loss": 1.3748, "step": 10759 }, { "epoch": 0.29, "learning_rate": 1.65657881746114e-05, "loss": 1.5049, "step": 10760 }, { "epoch": 0.29, "learning_rate": 1.6565121002813433e-05, "loss": 1.3503, "step": 10761 }, { "epoch": 0.29, "learning_rate": 1.6564453779653043e-05, "loss": 1.394, "step": 10762 }, { "epoch": 0.29, "learning_rate": 1.656378650513545e-05, "loss": 1.3831, "step": 10763 }, { "epoch": 0.29, "learning_rate": 1.6563119179265883e-05, "loss": 1.2185, "step": 10764 }, { "epoch": 0.29, "learning_rate": 1.6562451802049557e-05, "loss": 1.3926, "step": 10765 }, { "epoch": 0.29, "learning_rate": 1.6561784373491695e-05, "loss": 1.2578, "step": 10766 }, { "epoch": 0.29, "learning_rate": 1.6561116893597516e-05, "loss": 1.2974, "step": 10767 }, { "epoch": 0.29, "learning_rate": 1.6560449362372244e-05, "loss": 1.4324, "step": 10768 }, { "epoch": 0.29, "learning_rate": 1.65597817798211e-05, "loss": 1.1718, "step": 10769 }, { "epoch": 0.29, "learning_rate": 1.6559114145949307e-05, "loss": 1.2834, "step": 10770 }, { "epoch": 0.29, "learning_rate": 1.655844646076209e-05, "loss": 1.3501, "step": 10771 }, { "epoch": 0.29, "learning_rate": 1.6557778724264675e-05, "loss": 1.417, "step": 10772 }, { "epoch": 0.29, "learning_rate": 1.655711093646228e-05, "loss": 1.3625, "step": 10773 }, { "epoch": 0.29, "learning_rate": 1.6556443097360136e-05, "loss": 1.3513, "step": 10774 }, { "epoch": 0.29, "learning_rate": 1.655577520696346e-05, "loss": 1.3206, "step": 10775 }, { "epoch": 0.29, "learning_rate": 1.6555107265277484e-05, "loss": 1.4541, "step": 10776 }, { "epoch": 0.29, "learning_rate": 1.655443927230743e-05, "loss": 1.4609, "step": 10777 }, { "epoch": 0.29, "learning_rate": 1.6553771228058527e-05, "loss": 1.3876, "step": 10778 }, { "epoch": 0.29, "learning_rate": 1.6553103132535998e-05, "loss": 1.4385, "step": 10779 }, { "epoch": 0.29, "learning_rate": 1.6552434985745072e-05, "loss": 1.3943, "step": 10780 }, { "epoch": 0.29, "learning_rate": 1.6551766787690974e-05, "loss": 1.2761, "step": 10781 }, { "epoch": 0.29, "learning_rate": 1.6551098538378935e-05, "loss": 1.373, "step": 10782 }, { "epoch": 0.29, "learning_rate": 1.6550430237814182e-05, "loss": 1.4375, "step": 10783 }, { "epoch": 0.29, "learning_rate": 1.6549761886001943e-05, "loss": 1.3303, "step": 10784 }, { "epoch": 0.29, "learning_rate": 1.6549093482947447e-05, "loss": 1.3716, "step": 10785 }, { "epoch": 0.29, "learning_rate": 1.6548425028655925e-05, "loss": 1.2427, "step": 10786 }, { "epoch": 0.29, "learning_rate": 1.6547756523132597e-05, "loss": 1.3794, "step": 10787 }, { "epoch": 0.29, "learning_rate": 1.654708796638271e-05, "loss": 1.3687, "step": 10788 }, { "epoch": 0.29, "learning_rate": 1.654641935841148e-05, "loss": 1.4048, "step": 10789 }, { "epoch": 0.29, "learning_rate": 1.654575069922415e-05, "loss": 1.3857, "step": 10790 }, { "epoch": 0.29, "learning_rate": 1.6545081988825937e-05, "loss": 1.2886, "step": 10791 }, { "epoch": 0.29, "learning_rate": 1.6544413227222086e-05, "loss": 1.2588, "step": 10792 }, { "epoch": 0.29, "learning_rate": 1.6543744414417818e-05, "loss": 1.198, "step": 10793 }, { "epoch": 0.29, "learning_rate": 1.6543075550418373e-05, "loss": 1.3481, "step": 10794 }, { "epoch": 0.29, "learning_rate": 1.6542406635228983e-05, "loss": 1.3848, "step": 10795 }, { "epoch": 0.29, "learning_rate": 1.6541737668854877e-05, "loss": 1.1167, "step": 10796 }, { "epoch": 0.29, "learning_rate": 1.6541068651301294e-05, "loss": 1.3796, "step": 10797 }, { "epoch": 0.29, "learning_rate": 1.6540399582573465e-05, "loss": 1.3726, "step": 10798 }, { "epoch": 0.29, "learning_rate": 1.653973046267663e-05, "loss": 1.2456, "step": 10799 }, { "epoch": 0.29, "learning_rate": 1.653906129161601e-05, "loss": 1.4448, "step": 10800 }, { "epoch": 0.29, "learning_rate": 1.6538392069396853e-05, "loss": 1.2712, "step": 10801 }, { "epoch": 0.29, "learning_rate": 1.6537722796024392e-05, "loss": 1.2852, "step": 10802 }, { "epoch": 0.3, "learning_rate": 1.6537053471503864e-05, "loss": 1.1575, "step": 10803 }, { "epoch": 0.3, "learning_rate": 1.65363840958405e-05, "loss": 1.2446, "step": 10804 }, { "epoch": 0.3, "learning_rate": 1.653571466903954e-05, "loss": 1.397, "step": 10805 }, { "epoch": 0.3, "learning_rate": 1.6535045191106225e-05, "loss": 1.1533, "step": 10806 }, { "epoch": 0.3, "learning_rate": 1.653437566204579e-05, "loss": 1.3567, "step": 10807 }, { "epoch": 0.3, "learning_rate": 1.653370608186347e-05, "loss": 1.4138, "step": 10808 }, { "epoch": 0.3, "learning_rate": 1.6533036450564507e-05, "loss": 1.3137, "step": 10809 }, { "epoch": 0.3, "learning_rate": 1.6532366768154137e-05, "loss": 1.4512, "step": 10810 }, { "epoch": 0.3, "learning_rate": 1.6531697034637605e-05, "loss": 1.448, "step": 10811 }, { "epoch": 0.3, "learning_rate": 1.6531027250020143e-05, "loss": 1.2, "step": 10812 }, { "epoch": 0.3, "learning_rate": 1.6530357414306995e-05, "loss": 1.3035, "step": 10813 }, { "epoch": 0.3, "learning_rate": 1.6529687527503405e-05, "loss": 1.3286, "step": 10814 }, { "epoch": 0.3, "learning_rate": 1.652901758961461e-05, "loss": 1.4492, "step": 10815 }, { "epoch": 0.3, "learning_rate": 1.6528347600645846e-05, "loss": 1.1669, "step": 10816 }, { "epoch": 0.3, "learning_rate": 1.6527677560602364e-05, "loss": 1.3625, "step": 10817 }, { "epoch": 0.3, "learning_rate": 1.6527007469489402e-05, "loss": 1.6846, "step": 10818 }, { "epoch": 0.3, "learning_rate": 1.6526337327312202e-05, "loss": 1.3406, "step": 10819 }, { "epoch": 0.3, "learning_rate": 1.6525667134076008e-05, "loss": 1.2556, "step": 10820 }, { "epoch": 0.3, "learning_rate": 1.6524996889786065e-05, "loss": 1.7302, "step": 10821 }, { "epoch": 0.3, "learning_rate": 1.6524326594447612e-05, "loss": 1.2651, "step": 10822 }, { "epoch": 0.3, "learning_rate": 1.65236562480659e-05, "loss": 1.3438, "step": 10823 }, { "epoch": 0.3, "learning_rate": 1.6522985850646166e-05, "loss": 1.1024, "step": 10824 }, { "epoch": 0.3, "learning_rate": 1.6522315402193656e-05, "loss": 1.3008, "step": 10825 }, { "epoch": 0.3, "learning_rate": 1.652164490271362e-05, "loss": 1.4116, "step": 10826 }, { "epoch": 0.3, "learning_rate": 1.6520974352211297e-05, "loss": 1.1477, "step": 10827 }, { "epoch": 0.3, "learning_rate": 1.6520303750691945e-05, "loss": 1.2319, "step": 10828 }, { "epoch": 0.3, "learning_rate": 1.6519633098160795e-05, "loss": 1.3525, "step": 10829 }, { "epoch": 0.3, "learning_rate": 1.6518962394623104e-05, "loss": 1.246, "step": 10830 }, { "epoch": 0.3, "learning_rate": 1.6518291640084116e-05, "loss": 1.4246, "step": 10831 }, { "epoch": 0.3, "learning_rate": 1.6517620834549078e-05, "loss": 1.2952, "step": 10832 }, { "epoch": 0.3, "learning_rate": 1.6516949978023243e-05, "loss": 1.355, "step": 10833 }, { "epoch": 0.3, "learning_rate": 1.6516279070511853e-05, "loss": 1.3076, "step": 10834 }, { "epoch": 0.3, "learning_rate": 1.651560811202016e-05, "loss": 1.426, "step": 10835 }, { "epoch": 0.3, "learning_rate": 1.6514937102553418e-05, "loss": 1.4417, "step": 10836 }, { "epoch": 0.3, "learning_rate": 1.6514266042116866e-05, "loss": 1.2393, "step": 10837 }, { "epoch": 0.3, "learning_rate": 1.651359493071576e-05, "loss": 1.3284, "step": 10838 }, { "epoch": 0.3, "learning_rate": 1.6512923768355352e-05, "loss": 1.2009, "step": 10839 }, { "epoch": 0.3, "learning_rate": 1.6512252555040893e-05, "loss": 1.4146, "step": 10840 }, { "epoch": 0.3, "learning_rate": 1.651158129077763e-05, "loss": 1.2964, "step": 10841 }, { "epoch": 0.3, "learning_rate": 1.6510909975570813e-05, "loss": 1.4458, "step": 10842 }, { "epoch": 0.3, "learning_rate": 1.6510238609425705e-05, "loss": 1.377, "step": 10843 }, { "epoch": 0.3, "learning_rate": 1.650956719234755e-05, "loss": 1.2856, "step": 10844 }, { "epoch": 0.3, "learning_rate": 1.6508895724341597e-05, "loss": 1.3254, "step": 10845 }, { "epoch": 0.3, "learning_rate": 1.650822420541311e-05, "loss": 1.3064, "step": 10846 }, { "epoch": 0.3, "learning_rate": 1.6507552635567336e-05, "loss": 1.333, "step": 10847 }, { "epoch": 0.3, "learning_rate": 1.6506881014809528e-05, "loss": 1.1919, "step": 10848 }, { "epoch": 0.3, "learning_rate": 1.6506209343144942e-05, "loss": 1.2708, "step": 10849 }, { "epoch": 0.3, "learning_rate": 1.650553762057884e-05, "loss": 1.3733, "step": 10850 }, { "epoch": 0.3, "learning_rate": 1.6504865847116464e-05, "loss": 1.3032, "step": 10851 }, { "epoch": 0.3, "learning_rate": 1.650419402276308e-05, "loss": 1.3303, "step": 10852 }, { "epoch": 0.3, "learning_rate": 1.650352214752394e-05, "loss": 1.271, "step": 10853 }, { "epoch": 0.3, "learning_rate": 1.65028502214043e-05, "loss": 1.3743, "step": 10854 }, { "epoch": 0.3, "learning_rate": 1.6502178244409418e-05, "loss": 1.292, "step": 10855 }, { "epoch": 0.3, "learning_rate": 1.650150621654455e-05, "loss": 1.3008, "step": 10856 }, { "epoch": 0.3, "learning_rate": 1.6500834137814953e-05, "loss": 1.2529, "step": 10857 }, { "epoch": 0.3, "learning_rate": 1.6500162008225894e-05, "loss": 1.4668, "step": 10858 }, { "epoch": 0.3, "learning_rate": 1.649948982778262e-05, "loss": 1.4338, "step": 10859 }, { "epoch": 0.3, "learning_rate": 1.649881759649039e-05, "loss": 1.4199, "step": 10860 }, { "epoch": 0.3, "learning_rate": 1.649814531435447e-05, "loss": 1.5229, "step": 10861 }, { "epoch": 0.3, "learning_rate": 1.6497472981380117e-05, "loss": 1.2454, "step": 10862 }, { "epoch": 0.3, "learning_rate": 1.6496800597572587e-05, "loss": 1.4651, "step": 10863 }, { "epoch": 0.3, "learning_rate": 1.6496128162937148e-05, "loss": 1.3708, "step": 10864 }, { "epoch": 0.3, "learning_rate": 1.649545567747906e-05, "loss": 1.4241, "step": 10865 }, { "epoch": 0.3, "learning_rate": 1.6494783141203577e-05, "loss": 1.4609, "step": 10866 }, { "epoch": 0.3, "learning_rate": 1.6494110554115967e-05, "loss": 1.4131, "step": 10867 }, { "epoch": 0.3, "learning_rate": 1.6493437916221487e-05, "loss": 1.3228, "step": 10868 }, { "epoch": 0.3, "learning_rate": 1.6492765227525403e-05, "loss": 1.4385, "step": 10869 }, { "epoch": 0.3, "learning_rate": 1.6492092488032977e-05, "loss": 1.77, "step": 10870 }, { "epoch": 0.3, "learning_rate": 1.6491419697749473e-05, "loss": 1.394, "step": 10871 }, { "epoch": 0.3, "learning_rate": 1.6490746856680155e-05, "loss": 1.2935, "step": 10872 }, { "epoch": 0.3, "learning_rate": 1.6490073964830283e-05, "loss": 1.3787, "step": 10873 }, { "epoch": 0.3, "learning_rate": 1.6489401022205126e-05, "loss": 1.3213, "step": 10874 }, { "epoch": 0.3, "learning_rate": 1.6488728028809945e-05, "loss": 1.4587, "step": 10875 }, { "epoch": 0.3, "learning_rate": 1.6488054984650007e-05, "loss": 1.3499, "step": 10876 }, { "epoch": 0.3, "learning_rate": 1.648738188973058e-05, "loss": 1.2881, "step": 10877 }, { "epoch": 0.3, "learning_rate": 1.648670874405693e-05, "loss": 1.3809, "step": 10878 }, { "epoch": 0.3, "learning_rate": 1.6486035547634312e-05, "loss": 1.3015, "step": 10879 }, { "epoch": 0.3, "learning_rate": 1.648536230046801e-05, "loss": 1.3628, "step": 10880 }, { "epoch": 0.3, "learning_rate": 1.6484689002563282e-05, "loss": 1.4729, "step": 10881 }, { "epoch": 0.3, "learning_rate": 1.6484015653925394e-05, "loss": 1.3752, "step": 10882 }, { "epoch": 0.3, "learning_rate": 1.6483342254559618e-05, "loss": 1.7021, "step": 10883 }, { "epoch": 0.3, "learning_rate": 1.6482668804471222e-05, "loss": 1.4197, "step": 10884 }, { "epoch": 0.3, "learning_rate": 1.648199530366547e-05, "loss": 1.3611, "step": 10885 }, { "epoch": 0.3, "learning_rate": 1.6481321752147637e-05, "loss": 1.4004, "step": 10886 }, { "epoch": 0.3, "learning_rate": 1.6480648149922993e-05, "loss": 1.4961, "step": 10887 }, { "epoch": 0.3, "learning_rate": 1.64799744969968e-05, "loss": 1.3367, "step": 10888 }, { "epoch": 0.3, "learning_rate": 1.647930079337434e-05, "loss": 1.248, "step": 10889 }, { "epoch": 0.3, "learning_rate": 1.6478627039060872e-05, "loss": 1.3718, "step": 10890 }, { "epoch": 0.3, "learning_rate": 1.6477953234061673e-05, "loss": 1.3508, "step": 10891 }, { "epoch": 0.3, "learning_rate": 1.6477279378382016e-05, "loss": 1.3606, "step": 10892 }, { "epoch": 0.3, "learning_rate": 1.6476605472027173e-05, "loss": 1.4194, "step": 10893 }, { "epoch": 0.3, "learning_rate": 1.647593151500241e-05, "loss": 1.3569, "step": 10894 }, { "epoch": 0.3, "learning_rate": 1.6475257507313003e-05, "loss": 1.2849, "step": 10895 }, { "epoch": 0.3, "learning_rate": 1.647458344896423e-05, "loss": 1.4258, "step": 10896 }, { "epoch": 0.3, "learning_rate": 1.647390933996136e-05, "loss": 1.2427, "step": 10897 }, { "epoch": 0.3, "learning_rate": 1.6473235180309664e-05, "loss": 1.2625, "step": 10898 }, { "epoch": 0.3, "learning_rate": 1.6472560970014423e-05, "loss": 1.2874, "step": 10899 }, { "epoch": 0.3, "learning_rate": 1.647188670908091e-05, "loss": 1.2307, "step": 10900 }, { "epoch": 0.3, "learning_rate": 1.6471212397514397e-05, "loss": 1.3186, "step": 10901 }, { "epoch": 0.3, "learning_rate": 1.647053803532016e-05, "loss": 1.323, "step": 10902 }, { "epoch": 0.3, "learning_rate": 1.6469863622503478e-05, "loss": 1.261, "step": 10903 }, { "epoch": 0.3, "learning_rate": 1.6469189159069624e-05, "loss": 1.4766, "step": 10904 }, { "epoch": 0.3, "learning_rate": 1.6468514645023875e-05, "loss": 1.4268, "step": 10905 }, { "epoch": 0.3, "learning_rate": 1.6467840080371512e-05, "loss": 1.1589, "step": 10906 }, { "epoch": 0.3, "learning_rate": 1.646716546511781e-05, "loss": 1.479, "step": 10907 }, { "epoch": 0.3, "learning_rate": 1.6466490799268046e-05, "loss": 1.3718, "step": 10908 }, { "epoch": 0.3, "learning_rate": 1.6465816082827494e-05, "loss": 1.2534, "step": 10909 }, { "epoch": 0.3, "learning_rate": 1.646514131580144e-05, "loss": 1.3228, "step": 10910 }, { "epoch": 0.3, "learning_rate": 1.6464466498195166e-05, "loss": 1.3999, "step": 10911 }, { "epoch": 0.3, "learning_rate": 1.646379163001394e-05, "loss": 1.3599, "step": 10912 }, { "epoch": 0.3, "learning_rate": 1.6463116711263048e-05, "loss": 1.3376, "step": 10913 }, { "epoch": 0.3, "learning_rate": 1.6462441741947772e-05, "loss": 1.2532, "step": 10914 }, { "epoch": 0.3, "learning_rate": 1.6461766722073388e-05, "loss": 1.1121, "step": 10915 }, { "epoch": 0.3, "learning_rate": 1.6461091651645183e-05, "loss": 1.2236, "step": 10916 }, { "epoch": 0.3, "learning_rate": 1.646041653066843e-05, "loss": 1.2742, "step": 10917 }, { "epoch": 0.3, "learning_rate": 1.6459741359148424e-05, "loss": 1.364, "step": 10918 }, { "epoch": 0.3, "learning_rate": 1.6459066137090433e-05, "loss": 1.3638, "step": 10919 }, { "epoch": 0.3, "learning_rate": 1.645839086449975e-05, "loss": 1.1782, "step": 10920 }, { "epoch": 0.3, "learning_rate": 1.645771554138165e-05, "loss": 1.4163, "step": 10921 }, { "epoch": 0.3, "learning_rate": 1.6457040167741422e-05, "loss": 1.4268, "step": 10922 }, { "epoch": 0.3, "learning_rate": 1.645636474358435e-05, "loss": 1.2498, "step": 10923 }, { "epoch": 0.3, "learning_rate": 1.6455689268915714e-05, "loss": 1.3555, "step": 10924 }, { "epoch": 0.3, "learning_rate": 1.6455013743740796e-05, "loss": 1.2378, "step": 10925 }, { "epoch": 0.3, "learning_rate": 1.6454338168064893e-05, "loss": 1.3132, "step": 10926 }, { "epoch": 0.3, "learning_rate": 1.645366254189328e-05, "loss": 1.3286, "step": 10927 }, { "epoch": 0.3, "learning_rate": 1.645298686523125e-05, "loss": 1.4277, "step": 10928 }, { "epoch": 0.3, "learning_rate": 1.6452311138084082e-05, "loss": 1.3323, "step": 10929 }, { "epoch": 0.3, "learning_rate": 1.6451635360457065e-05, "loss": 1.3716, "step": 10930 }, { "epoch": 0.3, "learning_rate": 1.6450959532355488e-05, "loss": 1.1978, "step": 10931 }, { "epoch": 0.3, "learning_rate": 1.6450283653784634e-05, "loss": 1.3794, "step": 10932 }, { "epoch": 0.3, "learning_rate": 1.6449607724749797e-05, "loss": 1.1152, "step": 10933 }, { "epoch": 0.3, "learning_rate": 1.6448931745256263e-05, "loss": 1.2803, "step": 10934 }, { "epoch": 0.3, "learning_rate": 1.644825571530932e-05, "loss": 1.4844, "step": 10935 }, { "epoch": 0.3, "learning_rate": 1.644757963491425e-05, "loss": 1.2627, "step": 10936 }, { "epoch": 0.3, "learning_rate": 1.6446903504076356e-05, "loss": 1.4634, "step": 10937 }, { "epoch": 0.3, "learning_rate": 1.6446227322800918e-05, "loss": 1.3215, "step": 10938 }, { "epoch": 0.3, "learning_rate": 1.6445551091093226e-05, "loss": 1.344, "step": 10939 }, { "epoch": 0.3, "learning_rate": 1.6444874808958577e-05, "loss": 1.4761, "step": 10940 }, { "epoch": 0.3, "learning_rate": 1.644419847640226e-05, "loss": 1.499, "step": 10941 }, { "epoch": 0.3, "learning_rate": 1.6443522093429556e-05, "loss": 1.2217, "step": 10942 }, { "epoch": 0.3, "learning_rate": 1.6442845660045773e-05, "loss": 1.3379, "step": 10943 }, { "epoch": 0.3, "learning_rate": 1.644216917625619e-05, "loss": 1.1812, "step": 10944 }, { "epoch": 0.3, "learning_rate": 1.644149264206611e-05, "loss": 1.2764, "step": 10945 }, { "epoch": 0.3, "learning_rate": 1.6440816057480815e-05, "loss": 1.3694, "step": 10946 }, { "epoch": 0.3, "learning_rate": 1.6440139422505606e-05, "loss": 1.4182, "step": 10947 }, { "epoch": 0.3, "learning_rate": 1.6439462737145777e-05, "loss": 1.3992, "step": 10948 }, { "epoch": 0.3, "learning_rate": 1.6438786001406618e-05, "loss": 1.4041, "step": 10949 }, { "epoch": 0.3, "learning_rate": 1.6438109215293426e-05, "loss": 1.2458, "step": 10950 }, { "epoch": 0.3, "learning_rate": 1.6437432378811495e-05, "loss": 1.3547, "step": 10951 }, { "epoch": 0.3, "learning_rate": 1.6436755491966116e-05, "loss": 1.2688, "step": 10952 }, { "epoch": 0.3, "learning_rate": 1.6436078554762592e-05, "loss": 1.3804, "step": 10953 }, { "epoch": 0.3, "learning_rate": 1.6435401567206216e-05, "loss": 1.2891, "step": 10954 }, { "epoch": 0.3, "learning_rate": 1.6434724529302282e-05, "loss": 1.429, "step": 10955 }, { "epoch": 0.3, "learning_rate": 1.643404744105609e-05, "loss": 1.3979, "step": 10956 }, { "epoch": 0.3, "learning_rate": 1.6433370302472937e-05, "loss": 1.5186, "step": 10957 }, { "epoch": 0.3, "learning_rate": 1.643269311355812e-05, "loss": 1.4072, "step": 10958 }, { "epoch": 0.3, "learning_rate": 1.6432015874316934e-05, "loss": 1.2834, "step": 10959 }, { "epoch": 0.3, "learning_rate": 1.6431338584754684e-05, "loss": 1.3374, "step": 10960 }, { "epoch": 0.3, "learning_rate": 1.6430661244876668e-05, "loss": 1.3062, "step": 10961 }, { "epoch": 0.3, "learning_rate": 1.6429983854688177e-05, "loss": 1.3062, "step": 10962 }, { "epoch": 0.3, "learning_rate": 1.6429306414194515e-05, "loss": 1.3796, "step": 10963 }, { "epoch": 0.3, "learning_rate": 1.6428628923400988e-05, "loss": 1.303, "step": 10964 }, { "epoch": 0.3, "learning_rate": 1.642795138231289e-05, "loss": 1.4482, "step": 10965 }, { "epoch": 0.3, "learning_rate": 1.642727379093552e-05, "loss": 1.0167, "step": 10966 }, { "epoch": 0.3, "learning_rate": 1.6426596149274187e-05, "loss": 1.4514, "step": 10967 }, { "epoch": 0.3, "learning_rate": 1.6425918457334183e-05, "loss": 1.4319, "step": 10968 }, { "epoch": 0.3, "learning_rate": 1.6425240715120816e-05, "loss": 1.1726, "step": 10969 }, { "epoch": 0.3, "learning_rate": 1.6424562922639387e-05, "loss": 1.1914, "step": 10970 }, { "epoch": 0.3, "learning_rate": 1.64238850798952e-05, "loss": 1.5, "step": 10971 }, { "epoch": 0.3, "learning_rate": 1.6423207186893556e-05, "loss": 1.293, "step": 10972 }, { "epoch": 0.3, "learning_rate": 1.642252924363976e-05, "loss": 1.3914, "step": 10973 }, { "epoch": 0.3, "learning_rate": 1.6421851250139114e-05, "loss": 1.502, "step": 10974 }, { "epoch": 0.3, "learning_rate": 1.6421173206396926e-05, "loss": 1.6514, "step": 10975 }, { "epoch": 0.3, "learning_rate": 1.6420495112418497e-05, "loss": 1.283, "step": 10976 }, { "epoch": 0.3, "learning_rate": 1.641981696820913e-05, "loss": 1.2495, "step": 10977 }, { "epoch": 0.3, "learning_rate": 1.6419138773774136e-05, "loss": 1.3921, "step": 10978 }, { "epoch": 0.3, "learning_rate": 1.641846052911882e-05, "loss": 1.4399, "step": 10979 }, { "epoch": 0.3, "learning_rate": 1.6417782234248488e-05, "loss": 1.2185, "step": 10980 }, { "epoch": 0.3, "learning_rate": 1.6417103889168443e-05, "loss": 1.4004, "step": 10981 }, { "epoch": 0.3, "learning_rate": 1.6416425493883996e-05, "loss": 1.3218, "step": 10982 }, { "epoch": 0.3, "learning_rate": 1.6415747048400453e-05, "loss": 1.2114, "step": 10983 }, { "epoch": 0.3, "learning_rate": 1.6415068552723124e-05, "loss": 1.3015, "step": 10984 }, { "epoch": 0.3, "learning_rate": 1.6414390006857314e-05, "loss": 1.1157, "step": 10985 }, { "epoch": 0.3, "learning_rate": 1.6413711410808332e-05, "loss": 1.1187, "step": 10986 }, { "epoch": 0.3, "learning_rate": 1.6413032764581487e-05, "loss": 1.2913, "step": 10987 }, { "epoch": 0.3, "learning_rate": 1.641235406818209e-05, "loss": 1.1987, "step": 10988 }, { "epoch": 0.3, "learning_rate": 1.641167532161545e-05, "loss": 1.4458, "step": 10989 }, { "epoch": 0.3, "learning_rate": 1.6410996524886878e-05, "loss": 1.3354, "step": 10990 }, { "epoch": 0.3, "learning_rate": 1.6410317678001682e-05, "loss": 1.271, "step": 10991 }, { "epoch": 0.3, "learning_rate": 1.6409638780965177e-05, "loss": 1.4475, "step": 10992 }, { "epoch": 0.3, "learning_rate": 1.6408959833782668e-05, "loss": 1.3459, "step": 10993 }, { "epoch": 0.3, "learning_rate": 1.6408280836459474e-05, "loss": 1.4219, "step": 10994 }, { "epoch": 0.3, "learning_rate": 1.6407601789000905e-05, "loss": 1.3313, "step": 10995 }, { "epoch": 0.3, "learning_rate": 1.6406922691412274e-05, "loss": 1.291, "step": 10996 }, { "epoch": 0.3, "learning_rate": 1.6406243543698892e-05, "loss": 1.344, "step": 10997 }, { "epoch": 0.3, "learning_rate": 1.6405564345866072e-05, "loss": 1.3357, "step": 10998 }, { "epoch": 0.3, "learning_rate": 1.6404885097919128e-05, "loss": 1.4097, "step": 10999 }, { "epoch": 0.3, "learning_rate": 1.6404205799863375e-05, "loss": 1.4204, "step": 11000 }, { "epoch": 0.3, "learning_rate": 1.640352645170413e-05, "loss": 1.3406, "step": 11001 }, { "epoch": 0.3, "learning_rate": 1.6402847053446698e-05, "loss": 1.2742, "step": 11002 }, { "epoch": 0.3, "learning_rate": 1.6402167605096407e-05, "loss": 1.3224, "step": 11003 }, { "epoch": 0.3, "learning_rate": 1.6401488106658568e-05, "loss": 1.5483, "step": 11004 }, { "epoch": 0.3, "learning_rate": 1.6400808558138492e-05, "loss": 1.3594, "step": 11005 }, { "epoch": 0.3, "learning_rate": 1.6400128959541504e-05, "loss": 1.2646, "step": 11006 }, { "epoch": 0.3, "learning_rate": 1.6399449310872914e-05, "loss": 1.342, "step": 11007 }, { "epoch": 0.3, "learning_rate": 1.6398769612138044e-05, "loss": 1.2747, "step": 11008 }, { "epoch": 0.3, "learning_rate": 1.6398089863342205e-05, "loss": 1.3564, "step": 11009 }, { "epoch": 0.3, "learning_rate": 1.6397410064490724e-05, "loss": 1.2759, "step": 11010 }, { "epoch": 0.3, "learning_rate": 1.6396730215588913e-05, "loss": 1.2732, "step": 11011 }, { "epoch": 0.3, "learning_rate": 1.6396050316642095e-05, "loss": 1.3652, "step": 11012 }, { "epoch": 0.3, "learning_rate": 1.6395370367655586e-05, "loss": 1.2571, "step": 11013 }, { "epoch": 0.3, "learning_rate": 1.6394690368634705e-05, "loss": 1.2275, "step": 11014 }, { "epoch": 0.3, "learning_rate": 1.6394010319584775e-05, "loss": 1.5439, "step": 11015 }, { "epoch": 0.3, "learning_rate": 1.6393330220511116e-05, "loss": 1.3215, "step": 11016 }, { "epoch": 0.3, "learning_rate": 1.6392650071419046e-05, "loss": 1.3884, "step": 11017 }, { "epoch": 0.3, "learning_rate": 1.6391969872313886e-05, "loss": 1.2573, "step": 11018 }, { "epoch": 0.3, "learning_rate": 1.639128962320096e-05, "loss": 1.1855, "step": 11019 }, { "epoch": 0.3, "learning_rate": 1.639060932408559e-05, "loss": 1.3174, "step": 11020 }, { "epoch": 0.3, "learning_rate": 1.63899289749731e-05, "loss": 1.3918, "step": 11021 }, { "epoch": 0.3, "learning_rate": 1.6389248575868807e-05, "loss": 1.1643, "step": 11022 }, { "epoch": 0.3, "learning_rate": 1.638856812677804e-05, "loss": 1.3906, "step": 11023 }, { "epoch": 0.3, "learning_rate": 1.638788762770612e-05, "loss": 1.2585, "step": 11024 }, { "epoch": 0.3, "learning_rate": 1.638720707865837e-05, "loss": 1.2947, "step": 11025 }, { "epoch": 0.3, "learning_rate": 1.6386526479640115e-05, "loss": 1.4141, "step": 11026 }, { "epoch": 0.3, "learning_rate": 1.638584583065668e-05, "loss": 1.4624, "step": 11027 }, { "epoch": 0.3, "learning_rate": 1.6385165131713394e-05, "loss": 1.2104, "step": 11028 }, { "epoch": 0.3, "learning_rate": 1.6384484382815573e-05, "loss": 1.4048, "step": 11029 }, { "epoch": 0.3, "learning_rate": 1.638380358396855e-05, "loss": 1.7593, "step": 11030 }, { "epoch": 0.3, "learning_rate": 1.6383122735177655e-05, "loss": 1.3994, "step": 11031 }, { "epoch": 0.3, "learning_rate": 1.6382441836448203e-05, "loss": 1.2908, "step": 11032 }, { "epoch": 0.3, "learning_rate": 1.638176088778553e-05, "loss": 1.7139, "step": 11033 }, { "epoch": 0.3, "learning_rate": 1.6381079889194958e-05, "loss": 1.3574, "step": 11034 }, { "epoch": 0.3, "learning_rate": 1.638039884068182e-05, "loss": 1.2947, "step": 11035 }, { "epoch": 0.3, "learning_rate": 1.637971774225144e-05, "loss": 1.3779, "step": 11036 }, { "epoch": 0.3, "learning_rate": 1.637903659390915e-05, "loss": 1.2944, "step": 11037 }, { "epoch": 0.3, "learning_rate": 1.6378355395660276e-05, "loss": 1.2563, "step": 11038 }, { "epoch": 0.3, "learning_rate": 1.637767414751015e-05, "loss": 1.3628, "step": 11039 }, { "epoch": 0.3, "learning_rate": 1.63769928494641e-05, "loss": 1.248, "step": 11040 }, { "epoch": 0.3, "learning_rate": 1.6376311501527457e-05, "loss": 1.5413, "step": 11041 }, { "epoch": 0.3, "learning_rate": 1.637563010370555e-05, "loss": 1.3787, "step": 11042 }, { "epoch": 0.3, "learning_rate": 1.6374948656003713e-05, "loss": 1.5625, "step": 11043 }, { "epoch": 0.3, "learning_rate": 1.6374267158427274e-05, "loss": 1.2319, "step": 11044 }, { "epoch": 0.3, "learning_rate": 1.6373585610981562e-05, "loss": 1.4065, "step": 11045 }, { "epoch": 0.3, "learning_rate": 1.6372904013671923e-05, "loss": 1.394, "step": 11046 }, { "epoch": 0.3, "learning_rate": 1.6372222366503674e-05, "loss": 1.1553, "step": 11047 }, { "epoch": 0.3, "learning_rate": 1.6371540669482153e-05, "loss": 1.291, "step": 11048 }, { "epoch": 0.3, "learning_rate": 1.6370858922612692e-05, "loss": 1.3823, "step": 11049 }, { "epoch": 0.3, "learning_rate": 1.637017712590063e-05, "loss": 1.3545, "step": 11050 }, { "epoch": 0.3, "learning_rate": 1.6369495279351296e-05, "loss": 1.3086, "step": 11051 }, { "epoch": 0.3, "learning_rate": 1.6368813382970027e-05, "loss": 1.5564, "step": 11052 }, { "epoch": 0.3, "learning_rate": 1.636813143676216e-05, "loss": 1.2725, "step": 11053 }, { "epoch": 0.3, "learning_rate": 1.6367449440733024e-05, "loss": 1.2427, "step": 11054 }, { "epoch": 0.3, "learning_rate": 1.6366767394887956e-05, "loss": 1.4089, "step": 11055 }, { "epoch": 0.3, "learning_rate": 1.6366085299232296e-05, "loss": 1.5439, "step": 11056 }, { "epoch": 0.3, "learning_rate": 1.636540315377138e-05, "loss": 1.2129, "step": 11057 }, { "epoch": 0.3, "learning_rate": 1.6364720958510537e-05, "loss": 1.2856, "step": 11058 }, { "epoch": 0.3, "learning_rate": 1.6364038713455118e-05, "loss": 1.3259, "step": 11059 }, { "epoch": 0.3, "learning_rate": 1.6363356418610448e-05, "loss": 1.4563, "step": 11060 }, { "epoch": 0.3, "learning_rate": 1.636267407398187e-05, "loss": 1.3289, "step": 11061 }, { "epoch": 0.3, "learning_rate": 1.6361991679574722e-05, "loss": 1.4226, "step": 11062 }, { "epoch": 0.3, "learning_rate": 1.6361309235394342e-05, "loss": 1.282, "step": 11063 }, { "epoch": 0.3, "learning_rate": 1.6360626741446074e-05, "loss": 1.2493, "step": 11064 }, { "epoch": 0.3, "learning_rate": 1.6359944197735247e-05, "loss": 1.1934, "step": 11065 }, { "epoch": 0.3, "learning_rate": 1.635926160426721e-05, "loss": 1.3965, "step": 11066 }, { "epoch": 0.3, "learning_rate": 1.63585789610473e-05, "loss": 1.2739, "step": 11067 }, { "epoch": 0.3, "learning_rate": 1.635789626808086e-05, "loss": 1.3962, "step": 11068 }, { "epoch": 0.3, "learning_rate": 1.6357213525373228e-05, "loss": 1.3003, "step": 11069 }, { "epoch": 0.3, "learning_rate": 1.635653073292975e-05, "loss": 1.2563, "step": 11070 }, { "epoch": 0.3, "learning_rate": 1.635584789075576e-05, "loss": 1.4253, "step": 11071 }, { "epoch": 0.3, "learning_rate": 1.6355164998856604e-05, "loss": 1.4053, "step": 11072 }, { "epoch": 0.3, "learning_rate": 1.635448205723763e-05, "loss": 1.3716, "step": 11073 }, { "epoch": 0.3, "learning_rate": 1.6353799065904174e-05, "loss": 1.3994, "step": 11074 }, { "epoch": 0.3, "learning_rate": 1.6353116024861584e-05, "loss": 1.1733, "step": 11075 }, { "epoch": 0.3, "learning_rate": 1.6352432934115202e-05, "loss": 1.395, "step": 11076 }, { "epoch": 0.3, "learning_rate": 1.635174979367037e-05, "loss": 1.259, "step": 11077 }, { "epoch": 0.3, "learning_rate": 1.6351066603532432e-05, "loss": 1.3967, "step": 11078 }, { "epoch": 0.3, "learning_rate": 1.6350383363706737e-05, "loss": 1.3618, "step": 11079 }, { "epoch": 0.3, "learning_rate": 1.634970007419863e-05, "loss": 1.2705, "step": 11080 }, { "epoch": 0.3, "learning_rate": 1.6349016735013456e-05, "loss": 1.3877, "step": 11081 }, { "epoch": 0.3, "learning_rate": 1.634833334615656e-05, "loss": 1.1995, "step": 11082 }, { "epoch": 0.3, "learning_rate": 1.634764990763329e-05, "loss": 1.2505, "step": 11083 }, { "epoch": 0.3, "learning_rate": 1.634696641944899e-05, "loss": 1.3428, "step": 11084 }, { "epoch": 0.3, "learning_rate": 1.634628288160901e-05, "loss": 1.3943, "step": 11085 }, { "epoch": 0.3, "learning_rate": 1.6345599294118698e-05, "loss": 1.3003, "step": 11086 }, { "epoch": 0.3, "learning_rate": 1.6344915656983397e-05, "loss": 1.3293, "step": 11087 }, { "epoch": 0.3, "learning_rate": 1.6344231970208465e-05, "loss": 1.3062, "step": 11088 }, { "epoch": 0.3, "learning_rate": 1.634354823379924e-05, "loss": 1.262, "step": 11089 }, { "epoch": 0.3, "learning_rate": 1.634286444776108e-05, "loss": 1.3123, "step": 11090 }, { "epoch": 0.3, "learning_rate": 1.634218061209933e-05, "loss": 1.4719, "step": 11091 }, { "epoch": 0.3, "learning_rate": 1.6341496726819343e-05, "loss": 1.332, "step": 11092 }, { "epoch": 0.3, "learning_rate": 1.6340812791926465e-05, "loss": 1.3782, "step": 11093 }, { "epoch": 0.3, "learning_rate": 1.634012880742605e-05, "loss": 1.207, "step": 11094 }, { "epoch": 0.3, "learning_rate": 1.633944477332345e-05, "loss": 1.3569, "step": 11095 }, { "epoch": 0.3, "learning_rate": 1.6338760689624014e-05, "loss": 1.3376, "step": 11096 }, { "epoch": 0.3, "learning_rate": 1.6338076556333096e-05, "loss": 1.4246, "step": 11097 }, { "epoch": 0.3, "learning_rate": 1.6337392373456046e-05, "loss": 1.4214, "step": 11098 }, { "epoch": 0.3, "learning_rate": 1.633670814099822e-05, "loss": 1.2241, "step": 11099 }, { "epoch": 0.3, "learning_rate": 1.6336023858964965e-05, "loss": 1.2542, "step": 11100 }, { "epoch": 0.3, "learning_rate": 1.6335339527361645e-05, "loss": 1.3252, "step": 11101 }, { "epoch": 0.3, "learning_rate": 1.6334655146193602e-05, "loss": 1.2856, "step": 11102 }, { "epoch": 0.3, "learning_rate": 1.6333970715466197e-05, "loss": 1.1409, "step": 11103 }, { "epoch": 0.3, "learning_rate": 1.633328623518479e-05, "loss": 1.2939, "step": 11104 }, { "epoch": 0.3, "learning_rate": 1.6332601705354723e-05, "loss": 1.3315, "step": 11105 }, { "epoch": 0.3, "learning_rate": 1.6331917125981357e-05, "loss": 1.3511, "step": 11106 }, { "epoch": 0.3, "learning_rate": 1.6331232497070055e-05, "loss": 1.2314, "step": 11107 }, { "epoch": 0.3, "learning_rate": 1.633054781862616e-05, "loss": 1.2842, "step": 11108 }, { "epoch": 0.3, "learning_rate": 1.6329863090655043e-05, "loss": 1.1157, "step": 11109 }, { "epoch": 0.3, "learning_rate": 1.632917831316205e-05, "loss": 1.3052, "step": 11110 }, { "epoch": 0.3, "learning_rate": 1.632849348615254e-05, "loss": 1.2417, "step": 11111 }, { "epoch": 0.3, "learning_rate": 1.6327808609631874e-05, "loss": 1.3459, "step": 11112 }, { "epoch": 0.3, "learning_rate": 1.632712368360541e-05, "loss": 1.3672, "step": 11113 }, { "epoch": 0.3, "learning_rate": 1.6326438708078508e-05, "loss": 1.2263, "step": 11114 }, { "epoch": 0.3, "learning_rate": 1.632575368305652e-05, "loss": 1.3662, "step": 11115 }, { "epoch": 0.3, "learning_rate": 1.632506860854481e-05, "loss": 1.3867, "step": 11116 }, { "epoch": 0.3, "learning_rate": 1.632438348454874e-05, "loss": 1.5615, "step": 11117 }, { "epoch": 0.3, "learning_rate": 1.632369831107367e-05, "loss": 1.2991, "step": 11118 }, { "epoch": 0.3, "learning_rate": 1.6323013088124954e-05, "loss": 1.5662, "step": 11119 }, { "epoch": 0.3, "learning_rate": 1.6322327815707953e-05, "loss": 1.3062, "step": 11120 }, { "epoch": 0.3, "learning_rate": 1.632164249382804e-05, "loss": 1.5029, "step": 11121 }, { "epoch": 0.3, "learning_rate": 1.6320957122490564e-05, "loss": 1.3069, "step": 11122 }, { "epoch": 0.3, "learning_rate": 1.6320271701700895e-05, "loss": 1.2861, "step": 11123 }, { "epoch": 0.3, "learning_rate": 1.631958623146439e-05, "loss": 1.3784, "step": 11124 }, { "epoch": 0.3, "learning_rate": 1.6318900711786414e-05, "loss": 1.2644, "step": 11125 }, { "epoch": 0.3, "learning_rate": 1.6318215142672332e-05, "loss": 1.1958, "step": 11126 }, { "epoch": 0.3, "learning_rate": 1.63175295241275e-05, "loss": 1.1553, "step": 11127 }, { "epoch": 0.3, "learning_rate": 1.6316843856157295e-05, "loss": 1.4197, "step": 11128 }, { "epoch": 0.3, "learning_rate": 1.631615813876707e-05, "loss": 1.2949, "step": 11129 }, { "epoch": 0.3, "learning_rate": 1.6315472371962196e-05, "loss": 1.4058, "step": 11130 }, { "epoch": 0.3, "learning_rate": 1.6314786555748034e-05, "loss": 1.3853, "step": 11131 }, { "epoch": 0.3, "learning_rate": 1.6314100690129953e-05, "loss": 1.4287, "step": 11132 }, { "epoch": 0.3, "learning_rate": 1.6313414775113318e-05, "loss": 1.2405, "step": 11133 }, { "epoch": 0.3, "learning_rate": 1.6312728810703495e-05, "loss": 1.1312, "step": 11134 }, { "epoch": 0.3, "learning_rate": 1.6312042796905846e-05, "loss": 1.3469, "step": 11135 }, { "epoch": 0.3, "learning_rate": 1.6311356733725744e-05, "loss": 1.175, "step": 11136 }, { "epoch": 0.3, "learning_rate": 1.6310670621168557e-05, "loss": 1.5178, "step": 11137 }, { "epoch": 0.3, "learning_rate": 1.630998445923965e-05, "loss": 1.3391, "step": 11138 }, { "epoch": 0.3, "learning_rate": 1.6309298247944387e-05, "loss": 1.251, "step": 11139 }, { "epoch": 0.3, "learning_rate": 1.6308611987288147e-05, "loss": 1.4021, "step": 11140 }, { "epoch": 0.3, "learning_rate": 1.630792567727629e-05, "loss": 1.2698, "step": 11141 }, { "epoch": 0.3, "learning_rate": 1.630723931791419e-05, "loss": 1.2649, "step": 11142 }, { "epoch": 0.3, "learning_rate": 1.6306552909207215e-05, "loss": 1.2197, "step": 11143 }, { "epoch": 0.3, "learning_rate": 1.6305866451160735e-05, "loss": 1.3904, "step": 11144 }, { "epoch": 0.3, "learning_rate": 1.6305179943780122e-05, "loss": 1.2129, "step": 11145 }, { "epoch": 0.3, "learning_rate": 1.6304493387070747e-05, "loss": 1.5151, "step": 11146 }, { "epoch": 0.3, "learning_rate": 1.6303806781037982e-05, "loss": 1.4524, "step": 11147 }, { "epoch": 0.3, "learning_rate": 1.6303120125687195e-05, "loss": 1.3159, "step": 11148 }, { "epoch": 0.3, "learning_rate": 1.630243342102376e-05, "loss": 1.4226, "step": 11149 }, { "epoch": 0.3, "learning_rate": 1.6301746667053048e-05, "loss": 1.1721, "step": 11150 }, { "epoch": 0.3, "learning_rate": 1.6301059863780432e-05, "loss": 1.2124, "step": 11151 }, { "epoch": 0.3, "learning_rate": 1.630037301121129e-05, "loss": 1.3467, "step": 11152 }, { "epoch": 0.3, "learning_rate": 1.6299686109350996e-05, "loss": 1.5171, "step": 11153 }, { "epoch": 0.3, "learning_rate": 1.6298999158204912e-05, "loss": 1.29, "step": 11154 }, { "epoch": 0.3, "learning_rate": 1.6298312157778425e-05, "loss": 1.3347, "step": 11155 }, { "epoch": 0.3, "learning_rate": 1.6297625108076904e-05, "loss": 1.3657, "step": 11156 }, { "epoch": 0.3, "learning_rate": 1.6296938009105727e-05, "loss": 1.4497, "step": 11157 }, { "epoch": 0.3, "learning_rate": 1.6296250860870266e-05, "loss": 1.4211, "step": 11158 }, { "epoch": 0.3, "learning_rate": 1.6295563663375898e-05, "loss": 1.4111, "step": 11159 }, { "epoch": 0.3, "learning_rate": 1.6294876416628002e-05, "loss": 1.3105, "step": 11160 }, { "epoch": 0.3, "learning_rate": 1.6294189120631956e-05, "loss": 1.3896, "step": 11161 }, { "epoch": 0.3, "learning_rate": 1.6293501775393132e-05, "loss": 1.3774, "step": 11162 }, { "epoch": 0.3, "learning_rate": 1.629281438091691e-05, "loss": 1.2881, "step": 11163 }, { "epoch": 0.3, "learning_rate": 1.6292126937208665e-05, "loss": 1.2666, "step": 11164 }, { "epoch": 0.3, "learning_rate": 1.6291439444273776e-05, "loss": 1.4062, "step": 11165 }, { "epoch": 0.3, "learning_rate": 1.6290751902117627e-05, "loss": 1.4263, "step": 11166 }, { "epoch": 0.3, "learning_rate": 1.6290064310745594e-05, "loss": 1.3992, "step": 11167 }, { "epoch": 0.3, "learning_rate": 1.628937667016305e-05, "loss": 1.2551, "step": 11168 }, { "epoch": 0.31, "learning_rate": 1.6288688980375387e-05, "loss": 1.3035, "step": 11169 }, { "epoch": 0.31, "learning_rate": 1.6288001241387978e-05, "loss": 1.2461, "step": 11170 }, { "epoch": 0.31, "learning_rate": 1.62873134532062e-05, "loss": 1.4807, "step": 11171 }, { "epoch": 0.31, "learning_rate": 1.628662561583544e-05, "loss": 1.5078, "step": 11172 }, { "epoch": 0.31, "learning_rate": 1.6285937729281074e-05, "loss": 1.3923, "step": 11173 }, { "epoch": 0.31, "learning_rate": 1.6285249793548494e-05, "loss": 1.458, "step": 11174 }, { "epoch": 0.31, "learning_rate": 1.6284561808643073e-05, "loss": 1.4697, "step": 11175 }, { "epoch": 0.31, "learning_rate": 1.628387377457019e-05, "loss": 1.3589, "step": 11176 }, { "epoch": 0.31, "learning_rate": 1.6283185691335236e-05, "loss": 1.2192, "step": 11177 }, { "epoch": 0.31, "learning_rate": 1.6282497558943595e-05, "loss": 1.2573, "step": 11178 }, { "epoch": 0.31, "learning_rate": 1.6281809377400648e-05, "loss": 1.4373, "step": 11179 }, { "epoch": 0.31, "learning_rate": 1.6281121146711775e-05, "loss": 1.2341, "step": 11180 }, { "epoch": 0.31, "learning_rate": 1.6280432866882367e-05, "loss": 1.4412, "step": 11181 }, { "epoch": 0.31, "learning_rate": 1.62797445379178e-05, "loss": 1.4067, "step": 11182 }, { "epoch": 0.31, "learning_rate": 1.627905615982347e-05, "loss": 1.3496, "step": 11183 }, { "epoch": 0.31, "learning_rate": 1.6278367732604755e-05, "loss": 1.5156, "step": 11184 }, { "epoch": 0.31, "learning_rate": 1.6277679256267044e-05, "loss": 1.7534, "step": 11185 }, { "epoch": 0.31, "learning_rate": 1.6276990730815723e-05, "loss": 1.2527, "step": 11186 }, { "epoch": 0.31, "learning_rate": 1.6276302156256173e-05, "loss": 1.4785, "step": 11187 }, { "epoch": 0.31, "learning_rate": 1.627561353259379e-05, "loss": 1.281, "step": 11188 }, { "epoch": 0.31, "learning_rate": 1.627492485983396e-05, "loss": 1.3564, "step": 11189 }, { "epoch": 0.31, "learning_rate": 1.6274236137982066e-05, "loss": 1.3262, "step": 11190 }, { "epoch": 0.31, "learning_rate": 1.62735473670435e-05, "loss": 1.2747, "step": 11191 }, { "epoch": 0.31, "learning_rate": 1.627285854702365e-05, "loss": 1.3281, "step": 11192 }, { "epoch": 0.31, "learning_rate": 1.6272169677927903e-05, "loss": 1.21, "step": 11193 }, { "epoch": 0.31, "learning_rate": 1.6271480759761652e-05, "loss": 1.2495, "step": 11194 }, { "epoch": 0.31, "learning_rate": 1.627079179253028e-05, "loss": 1.425, "step": 11195 }, { "epoch": 0.31, "learning_rate": 1.6270102776239185e-05, "loss": 1.3013, "step": 11196 }, { "epoch": 0.31, "learning_rate": 1.6269413710893752e-05, "loss": 1.429, "step": 11197 }, { "epoch": 0.31, "learning_rate": 1.626872459649938e-05, "loss": 1.1628, "step": 11198 }, { "epoch": 0.31, "learning_rate": 1.6268035433061447e-05, "loss": 1.4397, "step": 11199 }, { "epoch": 0.31, "learning_rate": 1.626734622058536e-05, "loss": 1.374, "step": 11200 }, { "epoch": 0.31, "learning_rate": 1.6266656959076495e-05, "loss": 1.26, "step": 11201 }, { "epoch": 0.31, "learning_rate": 1.626596764854026e-05, "loss": 1.3076, "step": 11202 }, { "epoch": 0.31, "learning_rate": 1.6265278288982032e-05, "loss": 1.4482, "step": 11203 }, { "epoch": 0.31, "learning_rate": 1.6264588880407218e-05, "loss": 1.3049, "step": 11204 }, { "epoch": 0.31, "learning_rate": 1.6263899422821208e-05, "loss": 1.3564, "step": 11205 }, { "epoch": 0.31, "learning_rate": 1.626320991622939e-05, "loss": 1.3345, "step": 11206 }, { "epoch": 0.31, "learning_rate": 1.626252036063717e-05, "loss": 1.1948, "step": 11207 }, { "epoch": 0.31, "learning_rate": 1.626183075604993e-05, "loss": 1.2942, "step": 11208 }, { "epoch": 0.31, "learning_rate": 1.626114110247307e-05, "loss": 1.4277, "step": 11209 }, { "epoch": 0.31, "learning_rate": 1.626045139991199e-05, "loss": 1.1855, "step": 11210 }, { "epoch": 0.31, "learning_rate": 1.6259761648372082e-05, "loss": 1.3416, "step": 11211 }, { "epoch": 0.31, "learning_rate": 1.6259071847858742e-05, "loss": 1.3489, "step": 11212 }, { "epoch": 0.31, "learning_rate": 1.625838199837736e-05, "loss": 1.2324, "step": 11213 }, { "epoch": 0.31, "learning_rate": 1.625769209993335e-05, "loss": 1.3076, "step": 11214 }, { "epoch": 0.31, "learning_rate": 1.6257002152532093e-05, "loss": 1.3982, "step": 11215 }, { "epoch": 0.31, "learning_rate": 1.6256312156178996e-05, "loss": 1.2826, "step": 11216 }, { "epoch": 0.31, "learning_rate": 1.6255622110879456e-05, "loss": 1.4749, "step": 11217 }, { "epoch": 0.31, "learning_rate": 1.6254932016638868e-05, "loss": 1.3342, "step": 11218 }, { "epoch": 0.31, "learning_rate": 1.6254241873462635e-05, "loss": 1.2715, "step": 11219 }, { "epoch": 0.31, "learning_rate": 1.625355168135615e-05, "loss": 1.1824, "step": 11220 }, { "epoch": 0.31, "learning_rate": 1.625286144032482e-05, "loss": 1.396, "step": 11221 }, { "epoch": 0.31, "learning_rate": 1.6252171150374044e-05, "loss": 1.4863, "step": 11222 }, { "epoch": 0.31, "learning_rate": 1.6251480811509223e-05, "loss": 1.28, "step": 11223 }, { "epoch": 0.31, "learning_rate": 1.6250790423735753e-05, "loss": 1.3997, "step": 11224 }, { "epoch": 0.31, "learning_rate": 1.6250099987059036e-05, "loss": 1.2424, "step": 11225 }, { "epoch": 0.31, "learning_rate": 1.6249409501484476e-05, "loss": 1.4722, "step": 11226 }, { "epoch": 0.31, "learning_rate": 1.6248718967017477e-05, "loss": 1.4114, "step": 11227 }, { "epoch": 0.31, "learning_rate": 1.624802838366344e-05, "loss": 1.3823, "step": 11228 }, { "epoch": 0.31, "learning_rate": 1.6247337751427767e-05, "loss": 1.4097, "step": 11229 }, { "epoch": 0.31, "learning_rate": 1.6246647070315857e-05, "loss": 1.2246, "step": 11230 }, { "epoch": 0.31, "learning_rate": 1.624595634033312e-05, "loss": 1.4045, "step": 11231 }, { "epoch": 0.31, "learning_rate": 1.6245265561484957e-05, "loss": 1.4231, "step": 11232 }, { "epoch": 0.31, "learning_rate": 1.6244574733776777e-05, "loss": 1.3657, "step": 11233 }, { "epoch": 0.31, "learning_rate": 1.6243883857213977e-05, "loss": 1.2385, "step": 11234 }, { "epoch": 0.31, "learning_rate": 1.6243192931801967e-05, "loss": 1.3528, "step": 11235 }, { "epoch": 0.31, "learning_rate": 1.6242501957546147e-05, "loss": 1.4209, "step": 11236 }, { "epoch": 0.31, "learning_rate": 1.6241810934451933e-05, "loss": 1.1968, "step": 11237 }, { "epoch": 0.31, "learning_rate": 1.6241119862524724e-05, "loss": 1.2859, "step": 11238 }, { "epoch": 0.31, "learning_rate": 1.6240428741769925e-05, "loss": 1.3877, "step": 11239 }, { "epoch": 0.31, "learning_rate": 1.623973757219295e-05, "loss": 1.3301, "step": 11240 }, { "epoch": 0.31, "learning_rate": 1.6239046353799198e-05, "loss": 1.2859, "step": 11241 }, { "epoch": 0.31, "learning_rate": 1.6238355086594083e-05, "loss": 1.2505, "step": 11242 }, { "epoch": 0.31, "learning_rate": 1.6237663770583014e-05, "loss": 1.3005, "step": 11243 }, { "epoch": 0.31, "learning_rate": 1.623697240577139e-05, "loss": 1.2991, "step": 11244 }, { "epoch": 0.31, "learning_rate": 1.6236280992164634e-05, "loss": 1.3464, "step": 11245 }, { "epoch": 0.31, "learning_rate": 1.6235589529768145e-05, "loss": 1.3281, "step": 11246 }, { "epoch": 0.31, "learning_rate": 1.6234898018587336e-05, "loss": 1.3464, "step": 11247 }, { "epoch": 0.31, "learning_rate": 1.623420645862762e-05, "loss": 1.2993, "step": 11248 }, { "epoch": 0.31, "learning_rate": 1.62335148498944e-05, "loss": 1.3743, "step": 11249 }, { "epoch": 0.31, "learning_rate": 1.623282319239309e-05, "loss": 1.3833, "step": 11250 }, { "epoch": 0.31, "learning_rate": 1.6232131486129103e-05, "loss": 1.2261, "step": 11251 }, { "epoch": 0.31, "learning_rate": 1.623143973110785e-05, "loss": 1.3867, "step": 11252 }, { "epoch": 0.31, "learning_rate": 1.6230747927334746e-05, "loss": 1.2251, "step": 11253 }, { "epoch": 0.31, "learning_rate": 1.62300560748152e-05, "loss": 1.2869, "step": 11254 }, { "epoch": 0.31, "learning_rate": 1.622936417355462e-05, "loss": 1.2156, "step": 11255 }, { "epoch": 0.31, "learning_rate": 1.622867222355843e-05, "loss": 1.4685, "step": 11256 }, { "epoch": 0.31, "learning_rate": 1.622798022483203e-05, "loss": 1.2607, "step": 11257 }, { "epoch": 0.31, "learning_rate": 1.622728817738085e-05, "loss": 1.4741, "step": 11258 }, { "epoch": 0.31, "learning_rate": 1.6226596081210287e-05, "loss": 1.4019, "step": 11259 }, { "epoch": 0.31, "learning_rate": 1.622590393632577e-05, "loss": 1.2744, "step": 11260 }, { "epoch": 0.31, "learning_rate": 1.6225211742732707e-05, "loss": 1.3647, "step": 11261 }, { "epoch": 0.31, "learning_rate": 1.6224519500436514e-05, "loss": 1.447, "step": 11262 }, { "epoch": 0.31, "learning_rate": 1.6223827209442607e-05, "loss": 1.2612, "step": 11263 }, { "epoch": 0.31, "learning_rate": 1.6223134869756405e-05, "loss": 1.3262, "step": 11264 }, { "epoch": 0.31, "learning_rate": 1.622244248138332e-05, "loss": 1.4902, "step": 11265 }, { "epoch": 0.31, "learning_rate": 1.622175004432877e-05, "loss": 1.3276, "step": 11266 }, { "epoch": 0.31, "learning_rate": 1.6221057558598173e-05, "loss": 1.7473, "step": 11267 }, { "epoch": 0.31, "learning_rate": 1.622036502419695e-05, "loss": 1.4707, "step": 11268 }, { "epoch": 0.31, "learning_rate": 1.6219672441130514e-05, "loss": 1.3108, "step": 11269 }, { "epoch": 0.31, "learning_rate": 1.621897980940429e-05, "loss": 1.356, "step": 11270 }, { "epoch": 0.31, "learning_rate": 1.6218287129023685e-05, "loss": 1.498, "step": 11271 }, { "epoch": 0.31, "learning_rate": 1.621759439999413e-05, "loss": 1.2854, "step": 11272 }, { "epoch": 0.31, "learning_rate": 1.621690162232104e-05, "loss": 1.4741, "step": 11273 }, { "epoch": 0.31, "learning_rate": 1.6216208796009835e-05, "loss": 1.3806, "step": 11274 }, { "epoch": 0.31, "learning_rate": 1.6215515921065933e-05, "loss": 1.2483, "step": 11275 }, { "epoch": 0.31, "learning_rate": 1.621482299749476e-05, "loss": 1.3474, "step": 11276 }, { "epoch": 0.31, "learning_rate": 1.621413002530173e-05, "loss": 1.3037, "step": 11277 }, { "epoch": 0.31, "learning_rate": 1.621343700449227e-05, "loss": 1.5166, "step": 11278 }, { "epoch": 0.31, "learning_rate": 1.6212743935071806e-05, "loss": 1.2532, "step": 11279 }, { "epoch": 0.31, "learning_rate": 1.621205081704575e-05, "loss": 1.3777, "step": 11280 }, { "epoch": 0.31, "learning_rate": 1.6211357650419532e-05, "loss": 1.6069, "step": 11281 }, { "epoch": 0.31, "learning_rate": 1.621066443519857e-05, "loss": 1.3611, "step": 11282 }, { "epoch": 0.31, "learning_rate": 1.6209971171388294e-05, "loss": 1.3567, "step": 11283 }, { "epoch": 0.31, "learning_rate": 1.6209277858994118e-05, "loss": 1.2976, "step": 11284 }, { "epoch": 0.31, "learning_rate": 1.6208584498021477e-05, "loss": 1.2959, "step": 11285 }, { "epoch": 0.31, "learning_rate": 1.620789108847579e-05, "loss": 1.1978, "step": 11286 }, { "epoch": 0.31, "learning_rate": 1.620719763036248e-05, "loss": 1.2454, "step": 11287 }, { "epoch": 0.31, "learning_rate": 1.6206504123686975e-05, "loss": 1.2417, "step": 11288 }, { "epoch": 0.31, "learning_rate": 1.6205810568454698e-05, "loss": 1.3694, "step": 11289 }, { "epoch": 0.31, "learning_rate": 1.620511696467108e-05, "loss": 1.2903, "step": 11290 }, { "epoch": 0.31, "learning_rate": 1.6204423312341546e-05, "loss": 1.3721, "step": 11291 }, { "epoch": 0.31, "learning_rate": 1.620372961147152e-05, "loss": 1.2815, "step": 11292 }, { "epoch": 0.31, "learning_rate": 1.6203035862066433e-05, "loss": 1.4302, "step": 11293 }, { "epoch": 0.31, "learning_rate": 1.6202342064131708e-05, "loss": 1.4058, "step": 11294 }, { "epoch": 0.31, "learning_rate": 1.6201648217672775e-05, "loss": 1.3828, "step": 11295 }, { "epoch": 0.31, "learning_rate": 1.620095432269506e-05, "loss": 1.4536, "step": 11296 }, { "epoch": 0.31, "learning_rate": 1.6200260379203994e-05, "loss": 1.3062, "step": 11297 }, { "epoch": 0.31, "learning_rate": 1.619956638720501e-05, "loss": 1.377, "step": 11298 }, { "epoch": 0.31, "learning_rate": 1.6198872346703537e-05, "loss": 1.2156, "step": 11299 }, { "epoch": 0.31, "learning_rate": 1.6198178257704994e-05, "loss": 1.3833, "step": 11300 }, { "epoch": 0.31, "learning_rate": 1.6197484120214827e-05, "loss": 1.2388, "step": 11301 }, { "epoch": 0.31, "learning_rate": 1.6196789934238452e-05, "loss": 1.4026, "step": 11302 }, { "epoch": 0.31, "learning_rate": 1.6196095699781313e-05, "loss": 1.3333, "step": 11303 }, { "epoch": 0.31, "learning_rate": 1.6195401416848827e-05, "loss": 1.291, "step": 11304 }, { "epoch": 0.31, "learning_rate": 1.6194707085446436e-05, "loss": 1.3064, "step": 11305 }, { "epoch": 0.31, "learning_rate": 1.6194012705579574e-05, "loss": 1.3672, "step": 11306 }, { "epoch": 0.31, "learning_rate": 1.6193318277253666e-05, "loss": 1.3389, "step": 11307 }, { "epoch": 0.31, "learning_rate": 1.619262380047415e-05, "loss": 1.3796, "step": 11308 }, { "epoch": 0.31, "learning_rate": 1.6191929275246452e-05, "loss": 1.438, "step": 11309 }, { "epoch": 0.31, "learning_rate": 1.6191234701576016e-05, "loss": 1.321, "step": 11310 }, { "epoch": 0.31, "learning_rate": 1.619054007946827e-05, "loss": 1.2256, "step": 11311 }, { "epoch": 0.31, "learning_rate": 1.618984540892865e-05, "loss": 1.4956, "step": 11312 }, { "epoch": 0.31, "learning_rate": 1.6189150689962587e-05, "loss": 1.3555, "step": 11313 }, { "epoch": 0.31, "learning_rate": 1.6188455922575523e-05, "loss": 1.3831, "step": 11314 }, { "epoch": 0.31, "learning_rate": 1.618776110677289e-05, "loss": 1.397, "step": 11315 }, { "epoch": 0.31, "learning_rate": 1.618706624256012e-05, "loss": 1.4807, "step": 11316 }, { "epoch": 0.31, "learning_rate": 1.6186371329942656e-05, "loss": 1.251, "step": 11317 }, { "epoch": 0.31, "learning_rate": 1.618567636892593e-05, "loss": 1.1023, "step": 11318 }, { "epoch": 0.31, "learning_rate": 1.6184981359515382e-05, "loss": 1.3481, "step": 11319 }, { "epoch": 0.31, "learning_rate": 1.618428630171645e-05, "loss": 1.3206, "step": 11320 }, { "epoch": 0.31, "learning_rate": 1.6183591195534568e-05, "loss": 1.3203, "step": 11321 }, { "epoch": 0.31, "learning_rate": 1.6182896040975174e-05, "loss": 1.2603, "step": 11322 }, { "epoch": 0.31, "learning_rate": 1.618220083804371e-05, "loss": 1.3857, "step": 11323 }, { "epoch": 0.31, "learning_rate": 1.618150558674562e-05, "loss": 1.2126, "step": 11324 }, { "epoch": 0.31, "learning_rate": 1.618081028708633e-05, "loss": 1.479, "step": 11325 }, { "epoch": 0.31, "learning_rate": 1.6180114939071286e-05, "loss": 1.3704, "step": 11326 }, { "epoch": 0.31, "learning_rate": 1.6179419542705934e-05, "loss": 1.3706, "step": 11327 }, { "epoch": 0.31, "learning_rate": 1.6178724097995705e-05, "loss": 1.3098, "step": 11328 }, { "epoch": 0.31, "learning_rate": 1.6178028604946045e-05, "loss": 1.291, "step": 11329 }, { "epoch": 0.31, "learning_rate": 1.6177333063562395e-05, "loss": 1.313, "step": 11330 }, { "epoch": 0.31, "learning_rate": 1.6176637473850195e-05, "loss": 1.2834, "step": 11331 }, { "epoch": 0.31, "learning_rate": 1.617594183581489e-05, "loss": 1.5027, "step": 11332 }, { "epoch": 0.31, "learning_rate": 1.617524614946192e-05, "loss": 1.4709, "step": 11333 }, { "epoch": 0.31, "learning_rate": 1.617455041479673e-05, "loss": 1.4443, "step": 11334 }, { "epoch": 0.31, "learning_rate": 1.6173854631824757e-05, "loss": 1.4438, "step": 11335 }, { "epoch": 0.31, "learning_rate": 1.617315880055145e-05, "loss": 1.3354, "step": 11336 }, { "epoch": 0.31, "learning_rate": 1.617246292098225e-05, "loss": 1.2234, "step": 11337 }, { "epoch": 0.31, "learning_rate": 1.6171766993122604e-05, "loss": 1.415, "step": 11338 }, { "epoch": 0.31, "learning_rate": 1.6171071016977955e-05, "loss": 1.3975, "step": 11339 }, { "epoch": 0.31, "learning_rate": 1.617037499255375e-05, "loss": 1.416, "step": 11340 }, { "epoch": 0.31, "learning_rate": 1.6169678919855428e-05, "loss": 1.4272, "step": 11341 }, { "epoch": 0.31, "learning_rate": 1.6168982798888443e-05, "loss": 1.1946, "step": 11342 }, { "epoch": 0.31, "learning_rate": 1.6168286629658236e-05, "loss": 1.2268, "step": 11343 }, { "epoch": 0.31, "learning_rate": 1.6167590412170254e-05, "loss": 1.3707, "step": 11344 }, { "epoch": 0.31, "learning_rate": 1.6166894146429946e-05, "loss": 1.2222, "step": 11345 }, { "epoch": 0.31, "learning_rate": 1.6166197832442757e-05, "loss": 1.1594, "step": 11346 }, { "epoch": 0.31, "learning_rate": 1.6165501470214138e-05, "loss": 1.312, "step": 11347 }, { "epoch": 0.31, "learning_rate": 1.6164805059749533e-05, "loss": 1.394, "step": 11348 }, { "epoch": 0.31, "learning_rate": 1.6164108601054395e-05, "loss": 1.2751, "step": 11349 }, { "epoch": 0.31, "learning_rate": 1.6163412094134164e-05, "loss": 1.3291, "step": 11350 }, { "epoch": 0.31, "learning_rate": 1.61627155389943e-05, "loss": 1.4399, "step": 11351 }, { "epoch": 0.31, "learning_rate": 1.6162018935640245e-05, "loss": 1.4014, "step": 11352 }, { "epoch": 0.31, "learning_rate": 1.6161322284077453e-05, "loss": 1.3354, "step": 11353 }, { "epoch": 0.31, "learning_rate": 1.6160625584311375e-05, "loss": 1.2954, "step": 11354 }, { "epoch": 0.31, "learning_rate": 1.6159928836347455e-05, "loss": 1.3777, "step": 11355 }, { "epoch": 0.31, "learning_rate": 1.615923204019115e-05, "loss": 1.2927, "step": 11356 }, { "epoch": 0.31, "learning_rate": 1.615853519584791e-05, "loss": 1.3855, "step": 11357 }, { "epoch": 0.31, "learning_rate": 1.6157838303323187e-05, "loss": 1.4253, "step": 11358 }, { "epoch": 0.31, "learning_rate": 1.6157141362622432e-05, "loss": 1.4329, "step": 11359 }, { "epoch": 0.31, "learning_rate": 1.6156444373751096e-05, "loss": 1.2563, "step": 11360 }, { "epoch": 0.31, "learning_rate": 1.6155747336714638e-05, "loss": 1.3135, "step": 11361 }, { "epoch": 0.31, "learning_rate": 1.6155050251518506e-05, "loss": 1.3486, "step": 11362 }, { "epoch": 0.31, "learning_rate": 1.6154353118168154e-05, "loss": 1.2163, "step": 11363 }, { "epoch": 0.31, "learning_rate": 1.6153655936669038e-05, "loss": 1.3608, "step": 11364 }, { "epoch": 0.31, "learning_rate": 1.6152958707026615e-05, "loss": 1.2046, "step": 11365 }, { "epoch": 0.31, "learning_rate": 1.615226142924633e-05, "loss": 1.3694, "step": 11366 }, { "epoch": 0.31, "learning_rate": 1.615156410333365e-05, "loss": 1.4153, "step": 11367 }, { "epoch": 0.31, "learning_rate": 1.6150866729294024e-05, "loss": 1.2961, "step": 11368 }, { "epoch": 0.31, "learning_rate": 1.615016930713291e-05, "loss": 1.4971, "step": 11369 }, { "epoch": 0.31, "learning_rate": 1.6149471836855757e-05, "loss": 1.3906, "step": 11370 }, { "epoch": 0.31, "learning_rate": 1.6148774318468036e-05, "loss": 1.2832, "step": 11371 }, { "epoch": 0.31, "learning_rate": 1.614807675197519e-05, "loss": 1.3877, "step": 11372 }, { "epoch": 0.31, "learning_rate": 1.6147379137382686e-05, "loss": 1.2368, "step": 11373 }, { "epoch": 0.31, "learning_rate": 1.6146681474695977e-05, "loss": 1.3452, "step": 11374 }, { "epoch": 0.31, "learning_rate": 1.6145983763920524e-05, "loss": 1.7271, "step": 11375 }, { "epoch": 0.31, "learning_rate": 1.6145286005061782e-05, "loss": 1.3345, "step": 11376 }, { "epoch": 0.31, "learning_rate": 1.614458819812521e-05, "loss": 1.3452, "step": 11377 }, { "epoch": 0.31, "learning_rate": 1.6143890343116275e-05, "loss": 1.3547, "step": 11378 }, { "epoch": 0.31, "learning_rate": 1.614319244004043e-05, "loss": 1.4131, "step": 11379 }, { "epoch": 0.31, "learning_rate": 1.614249448890313e-05, "loss": 1.3091, "step": 11380 }, { "epoch": 0.31, "learning_rate": 1.614179648970985e-05, "loss": 1.2949, "step": 11381 }, { "epoch": 0.31, "learning_rate": 1.6141098442466035e-05, "loss": 1.3674, "step": 11382 }, { "epoch": 0.31, "learning_rate": 1.6140400347177157e-05, "loss": 1.3989, "step": 11383 }, { "epoch": 0.31, "learning_rate": 1.6139702203848676e-05, "loss": 1.3984, "step": 11384 }, { "epoch": 0.31, "learning_rate": 1.6139004012486052e-05, "loss": 1.1658, "step": 11385 }, { "epoch": 0.31, "learning_rate": 1.613830577309474e-05, "loss": 1.3442, "step": 11386 }, { "epoch": 0.31, "learning_rate": 1.613760748568022e-05, "loss": 1.3467, "step": 11387 }, { "epoch": 0.31, "learning_rate": 1.613690915024794e-05, "loss": 1.2883, "step": 11388 }, { "epoch": 0.31, "learning_rate": 1.613621076680337e-05, "loss": 1.3691, "step": 11389 }, { "epoch": 0.31, "learning_rate": 1.613551233535197e-05, "loss": 1.3083, "step": 11390 }, { "epoch": 0.31, "learning_rate": 1.6134813855899206e-05, "loss": 1.4941, "step": 11391 }, { "epoch": 0.31, "learning_rate": 1.6134115328450547e-05, "loss": 1.2772, "step": 11392 }, { "epoch": 0.31, "learning_rate": 1.613341675301145e-05, "loss": 1.3093, "step": 11393 }, { "epoch": 0.31, "learning_rate": 1.613271812958739e-05, "loss": 1.4868, "step": 11394 }, { "epoch": 0.31, "learning_rate": 1.6132019458183824e-05, "loss": 1.4287, "step": 11395 }, { "epoch": 0.31, "learning_rate": 1.613132073880622e-05, "loss": 1.4561, "step": 11396 }, { "epoch": 0.31, "learning_rate": 1.6130621971460046e-05, "loss": 1.3247, "step": 11397 }, { "epoch": 0.31, "learning_rate": 1.612992315615077e-05, "loss": 1.4983, "step": 11398 }, { "epoch": 0.31, "learning_rate": 1.612922429288386e-05, "loss": 1.751, "step": 11399 }, { "epoch": 0.31, "learning_rate": 1.612852538166478e-05, "loss": 1.2502, "step": 11400 }, { "epoch": 0.31, "learning_rate": 1.6127826422498997e-05, "loss": 1.2446, "step": 11401 }, { "epoch": 0.31, "learning_rate": 1.612712741539198e-05, "loss": 1.2905, "step": 11402 }, { "epoch": 0.31, "learning_rate": 1.6126428360349204e-05, "loss": 1.176, "step": 11403 }, { "epoch": 0.31, "learning_rate": 1.612572925737613e-05, "loss": 1.2441, "step": 11404 }, { "epoch": 0.31, "learning_rate": 1.6125030106478233e-05, "loss": 1.458, "step": 11405 }, { "epoch": 0.31, "learning_rate": 1.6124330907660977e-05, "loss": 1.373, "step": 11406 }, { "epoch": 0.31, "learning_rate": 1.6123631660929838e-05, "loss": 1.3201, "step": 11407 }, { "epoch": 0.31, "learning_rate": 1.6122932366290286e-05, "loss": 1.4846, "step": 11408 }, { "epoch": 0.31, "learning_rate": 1.6122233023747788e-05, "loss": 1.304, "step": 11409 }, { "epoch": 0.31, "learning_rate": 1.612153363330782e-05, "loss": 1.4553, "step": 11410 }, { "epoch": 0.31, "learning_rate": 1.612083419497585e-05, "loss": 1.2542, "step": 11411 }, { "epoch": 0.31, "learning_rate": 1.612013470875735e-05, "loss": 1.2146, "step": 11412 }, { "epoch": 0.31, "learning_rate": 1.6119435174657797e-05, "loss": 1.3699, "step": 11413 }, { "epoch": 0.31, "learning_rate": 1.6118735592682663e-05, "loss": 1.2476, "step": 11414 }, { "epoch": 0.31, "learning_rate": 1.6118035962837414e-05, "loss": 1.25, "step": 11415 }, { "epoch": 0.31, "learning_rate": 1.6117336285127527e-05, "loss": 1.4224, "step": 11416 }, { "epoch": 0.31, "learning_rate": 1.6116636559558482e-05, "loss": 1.3743, "step": 11417 }, { "epoch": 0.31, "learning_rate": 1.611593678613575e-05, "loss": 1.1915, "step": 11418 }, { "epoch": 0.31, "learning_rate": 1.6115236964864798e-05, "loss": 1.5151, "step": 11419 }, { "epoch": 0.31, "learning_rate": 1.6114537095751112e-05, "loss": 1.3623, "step": 11420 }, { "epoch": 0.31, "learning_rate": 1.611383717880016e-05, "loss": 1.2786, "step": 11421 }, { "epoch": 0.31, "learning_rate": 1.6113137214017424e-05, "loss": 1.4514, "step": 11422 }, { "epoch": 0.31, "learning_rate": 1.6112437201408378e-05, "loss": 1.2722, "step": 11423 }, { "epoch": 0.31, "learning_rate": 1.6111737140978495e-05, "loss": 1.406, "step": 11424 }, { "epoch": 0.31, "learning_rate": 1.6111037032733253e-05, "loss": 1.2251, "step": 11425 }, { "epoch": 0.31, "learning_rate": 1.6110336876678134e-05, "loss": 1.2666, "step": 11426 }, { "epoch": 0.31, "learning_rate": 1.6109636672818613e-05, "loss": 1.3748, "step": 11427 }, { "epoch": 0.31, "learning_rate": 1.6108936421160166e-05, "loss": 1.2986, "step": 11428 }, { "epoch": 0.31, "learning_rate": 1.6108236121708275e-05, "loss": 1.2861, "step": 11429 }, { "epoch": 0.31, "learning_rate": 1.6107535774468414e-05, "loss": 1.3757, "step": 11430 }, { "epoch": 0.31, "learning_rate": 1.6106835379446066e-05, "loss": 1.3533, "step": 11431 }, { "epoch": 0.31, "learning_rate": 1.610613493664671e-05, "loss": 1.2039, "step": 11432 }, { "epoch": 0.31, "learning_rate": 1.6105434446075827e-05, "loss": 1.3828, "step": 11433 }, { "epoch": 0.31, "learning_rate": 1.6104733907738893e-05, "loss": 1.7837, "step": 11434 }, { "epoch": 0.31, "learning_rate": 1.6104033321641392e-05, "loss": 1.4722, "step": 11435 }, { "epoch": 0.31, "learning_rate": 1.6103332687788808e-05, "loss": 1.376, "step": 11436 }, { "epoch": 0.31, "learning_rate": 1.6102632006186615e-05, "loss": 1.2749, "step": 11437 }, { "epoch": 0.31, "learning_rate": 1.61019312768403e-05, "loss": 1.5039, "step": 11438 }, { "epoch": 0.31, "learning_rate": 1.6101230499755344e-05, "loss": 1.2964, "step": 11439 }, { "epoch": 0.31, "learning_rate": 1.610052967493723e-05, "loss": 1.2847, "step": 11440 }, { "epoch": 0.31, "learning_rate": 1.609982880239144e-05, "loss": 1.3123, "step": 11441 }, { "epoch": 0.31, "learning_rate": 1.609912788212346e-05, "loss": 1.3762, "step": 11442 }, { "epoch": 0.31, "learning_rate": 1.609842691413877e-05, "loss": 1.2878, "step": 11443 }, { "epoch": 0.31, "learning_rate": 1.6097725898442855e-05, "loss": 1.2334, "step": 11444 }, { "epoch": 0.31, "learning_rate": 1.60970248350412e-05, "loss": 1.2622, "step": 11445 }, { "epoch": 0.31, "learning_rate": 1.609632372393929e-05, "loss": 1.4006, "step": 11446 }, { "epoch": 0.31, "learning_rate": 1.609562256514261e-05, "loss": 1.3926, "step": 11447 }, { "epoch": 0.31, "learning_rate": 1.6094921358656645e-05, "loss": 1.4546, "step": 11448 }, { "epoch": 0.31, "learning_rate": 1.609422010448688e-05, "loss": 1.3489, "step": 11449 }, { "epoch": 0.31, "learning_rate": 1.6093518802638806e-05, "loss": 1.2986, "step": 11450 }, { "epoch": 0.31, "learning_rate": 1.6092817453117903e-05, "loss": 1.1204, "step": 11451 }, { "epoch": 0.31, "learning_rate": 1.6092116055929662e-05, "loss": 1.3474, "step": 11452 }, { "epoch": 0.31, "learning_rate": 1.609141461107957e-05, "loss": 1.4067, "step": 11453 }, { "epoch": 0.31, "learning_rate": 1.6090713118573117e-05, "loss": 1.3818, "step": 11454 }, { "epoch": 0.31, "learning_rate": 1.6090011578415788e-05, "loss": 1.418, "step": 11455 }, { "epoch": 0.31, "learning_rate": 1.608930999061307e-05, "loss": 1.301, "step": 11456 }, { "epoch": 0.31, "learning_rate": 1.6088608355170455e-05, "loss": 1.3291, "step": 11457 }, { "epoch": 0.31, "learning_rate": 1.608790667209343e-05, "loss": 1.3589, "step": 11458 }, { "epoch": 0.31, "learning_rate": 1.6087204941387486e-05, "loss": 1.3342, "step": 11459 }, { "epoch": 0.31, "learning_rate": 1.6086503163058112e-05, "loss": 1.332, "step": 11460 }, { "epoch": 0.31, "learning_rate": 1.6085801337110806e-05, "loss": 1.79, "step": 11461 }, { "epoch": 0.31, "learning_rate": 1.6085099463551042e-05, "loss": 1.2502, "step": 11462 }, { "epoch": 0.31, "learning_rate": 1.608439754238433e-05, "loss": 1.2949, "step": 11463 }, { "epoch": 0.31, "learning_rate": 1.608369557361615e-05, "loss": 1.323, "step": 11464 }, { "epoch": 0.31, "learning_rate": 1.6082993557251994e-05, "loss": 1.2068, "step": 11465 }, { "epoch": 0.31, "learning_rate": 1.608229149329736e-05, "loss": 1.3398, "step": 11466 }, { "epoch": 0.31, "learning_rate": 1.6081589381757738e-05, "loss": 1.4419, "step": 11467 }, { "epoch": 0.31, "learning_rate": 1.6080887222638614e-05, "loss": 1.4438, "step": 11468 }, { "epoch": 0.31, "learning_rate": 1.608018501594549e-05, "loss": 1.228, "step": 11469 }, { "epoch": 0.31, "learning_rate": 1.6079482761683863e-05, "loss": 1.199, "step": 11470 }, { "epoch": 0.31, "learning_rate": 1.6078780459859216e-05, "loss": 1.2043, "step": 11471 }, { "epoch": 0.31, "learning_rate": 1.6078078110477055e-05, "loss": 1.2827, "step": 11472 }, { "epoch": 0.31, "learning_rate": 1.6077375713542863e-05, "loss": 1.3352, "step": 11473 }, { "epoch": 0.31, "learning_rate": 1.6076673269062144e-05, "loss": 1.4292, "step": 11474 }, { "epoch": 0.31, "learning_rate": 1.607597077704039e-05, "loss": 1.4326, "step": 11475 }, { "epoch": 0.31, "learning_rate": 1.6075268237483103e-05, "loss": 1.1956, "step": 11476 }, { "epoch": 0.31, "learning_rate": 1.6074565650395764e-05, "loss": 1.4924, "step": 11477 }, { "epoch": 0.31, "learning_rate": 1.6073863015783887e-05, "loss": 1.3088, "step": 11478 }, { "epoch": 0.31, "learning_rate": 1.607316033365296e-05, "loss": 1.2336, "step": 11479 }, { "epoch": 0.31, "learning_rate": 1.6072457604008486e-05, "loss": 1.4048, "step": 11480 }, { "epoch": 0.31, "learning_rate": 1.6071754826855953e-05, "loss": 1.3628, "step": 11481 }, { "epoch": 0.31, "learning_rate": 1.6071052002200867e-05, "loss": 1.2671, "step": 11482 }, { "epoch": 0.31, "learning_rate": 1.6070349130048724e-05, "loss": 1.2972, "step": 11483 }, { "epoch": 0.31, "learning_rate": 1.606964621040503e-05, "loss": 1.4629, "step": 11484 }, { "epoch": 0.31, "learning_rate": 1.606894324327527e-05, "loss": 1.3237, "step": 11485 }, { "epoch": 0.31, "learning_rate": 1.6068240228664956e-05, "loss": 1.22, "step": 11486 }, { "epoch": 0.31, "learning_rate": 1.6067537166579586e-05, "loss": 1.252, "step": 11487 }, { "epoch": 0.31, "learning_rate": 1.6066834057024657e-05, "loss": 1.2798, "step": 11488 }, { "epoch": 0.31, "learning_rate": 1.606613090000567e-05, "loss": 1.3833, "step": 11489 }, { "epoch": 0.31, "learning_rate": 1.606542769552813e-05, "loss": 1.3948, "step": 11490 }, { "epoch": 0.31, "learning_rate": 1.6064724443597532e-05, "loss": 1.5664, "step": 11491 }, { "epoch": 0.31, "learning_rate": 1.6064021144219385e-05, "loss": 1.2659, "step": 11492 }, { "epoch": 0.31, "learning_rate": 1.6063317797399184e-05, "loss": 1.4102, "step": 11493 }, { "epoch": 0.31, "learning_rate": 1.6062614403142437e-05, "loss": 1.3716, "step": 11494 }, { "epoch": 0.31, "learning_rate": 1.606191096145465e-05, "loss": 1.218, "step": 11495 }, { "epoch": 0.31, "learning_rate": 1.6061207472341317e-05, "loss": 1.2715, "step": 11496 }, { "epoch": 0.31, "learning_rate": 1.606050393580795e-05, "loss": 1.4775, "step": 11497 }, { "epoch": 0.31, "learning_rate": 1.605980035186005e-05, "loss": 1.1665, "step": 11498 }, { "epoch": 0.31, "learning_rate": 1.6059096720503117e-05, "loss": 1.2515, "step": 11499 }, { "epoch": 0.31, "learning_rate": 1.6058393041742667e-05, "loss": 1.345, "step": 11500 }, { "epoch": 0.31, "learning_rate": 1.6057689315584192e-05, "loss": 1.1221, "step": 11501 }, { "epoch": 0.31, "learning_rate": 1.605698554203321e-05, "loss": 1.4082, "step": 11502 }, { "epoch": 0.31, "learning_rate": 1.605628172109522e-05, "loss": 1.3184, "step": 11503 }, { "epoch": 0.31, "learning_rate": 1.605557785277573e-05, "loss": 1.522, "step": 11504 }, { "epoch": 0.31, "learning_rate": 1.6054873937080248e-05, "loss": 1.4067, "step": 11505 }, { "epoch": 0.31, "learning_rate": 1.6054169974014273e-05, "loss": 1.4375, "step": 11506 }, { "epoch": 0.31, "learning_rate": 1.6053465963583324e-05, "loss": 1.2849, "step": 11507 }, { "epoch": 0.31, "learning_rate": 1.6052761905792903e-05, "loss": 1.2444, "step": 11508 }, { "epoch": 0.31, "learning_rate": 1.6052057800648516e-05, "loss": 1.3833, "step": 11509 }, { "epoch": 0.31, "learning_rate": 1.6051353648155678e-05, "loss": 1.3457, "step": 11510 }, { "epoch": 0.31, "learning_rate": 1.6050649448319898e-05, "loss": 1.3987, "step": 11511 }, { "epoch": 0.31, "learning_rate": 1.6049945201146676e-05, "loss": 1.3857, "step": 11512 }, { "epoch": 0.31, "learning_rate": 1.604924090664153e-05, "loss": 1.3955, "step": 11513 }, { "epoch": 0.31, "learning_rate": 1.6048536564809967e-05, "loss": 1.2983, "step": 11514 }, { "epoch": 0.31, "learning_rate": 1.60478321756575e-05, "loss": 1.3945, "step": 11515 }, { "epoch": 0.31, "learning_rate": 1.6047127739189635e-05, "loss": 1.4751, "step": 11516 }, { "epoch": 0.31, "learning_rate": 1.6046423255411888e-05, "loss": 1.2991, "step": 11517 }, { "epoch": 0.31, "learning_rate": 1.6045718724329766e-05, "loss": 1.4133, "step": 11518 }, { "epoch": 0.31, "learning_rate": 1.6045014145948786e-05, "loss": 1.4309, "step": 11519 }, { "epoch": 0.31, "learning_rate": 1.604430952027446e-05, "loss": 1.4326, "step": 11520 }, { "epoch": 0.31, "learning_rate": 1.6043604847312296e-05, "loss": 1.2988, "step": 11521 }, { "epoch": 0.31, "learning_rate": 1.604290012706781e-05, "loss": 1.3015, "step": 11522 }, { "epoch": 0.31, "learning_rate": 1.6042195359546516e-05, "loss": 1.4119, "step": 11523 }, { "epoch": 0.31, "learning_rate": 1.6041490544753924e-05, "loss": 1.2969, "step": 11524 }, { "epoch": 0.31, "learning_rate": 1.6040785682695555e-05, "loss": 1.2805, "step": 11525 }, { "epoch": 0.31, "learning_rate": 1.6040080773376915e-05, "loss": 1.355, "step": 11526 }, { "epoch": 0.31, "learning_rate": 1.6039375816803526e-05, "loss": 1.6479, "step": 11527 }, { "epoch": 0.31, "learning_rate": 1.60386708129809e-05, "loss": 1.25, "step": 11528 }, { "epoch": 0.31, "learning_rate": 1.603796576191455e-05, "loss": 1.3806, "step": 11529 }, { "epoch": 0.31, "learning_rate": 1.603726066361e-05, "loss": 1.2966, "step": 11530 }, { "epoch": 0.31, "learning_rate": 1.603655551807276e-05, "loss": 1.4785, "step": 11531 }, { "epoch": 0.31, "learning_rate": 1.6035850325308346e-05, "loss": 1.2988, "step": 11532 }, { "epoch": 0.31, "learning_rate": 1.6035145085322277e-05, "loss": 1.3237, "step": 11533 }, { "epoch": 0.31, "learning_rate": 1.6034439798120074e-05, "loss": 1.2444, "step": 11534 }, { "epoch": 0.32, "learning_rate": 1.603373446370725e-05, "loss": 1.3953, "step": 11535 }, { "epoch": 0.32, "learning_rate": 1.6033029082089327e-05, "loss": 1.2626, "step": 11536 }, { "epoch": 0.32, "learning_rate": 1.603232365327182e-05, "loss": 1.4116, "step": 11537 }, { "epoch": 0.32, "learning_rate": 1.603161817726025e-05, "loss": 1.4019, "step": 11538 }, { "epoch": 0.32, "learning_rate": 1.6030912654060135e-05, "loss": 1.3115, "step": 11539 }, { "epoch": 0.32, "learning_rate": 1.6030207083676993e-05, "loss": 1.2847, "step": 11540 }, { "epoch": 0.32, "learning_rate": 1.6029501466116348e-05, "loss": 1.2324, "step": 11541 }, { "epoch": 0.32, "learning_rate": 1.6028795801383717e-05, "loss": 1.2625, "step": 11542 }, { "epoch": 0.32, "learning_rate": 1.6028090089484626e-05, "loss": 1.3369, "step": 11543 }, { "epoch": 0.32, "learning_rate": 1.6027384330424593e-05, "loss": 1.2253, "step": 11544 }, { "epoch": 0.32, "learning_rate": 1.6026678524209138e-05, "loss": 1.3176, "step": 11545 }, { "epoch": 0.32, "learning_rate": 1.602597267084378e-05, "loss": 1.3799, "step": 11546 }, { "epoch": 0.32, "learning_rate": 1.602526677033405e-05, "loss": 1.4878, "step": 11547 }, { "epoch": 0.32, "learning_rate": 1.6024560822685466e-05, "loss": 1.2878, "step": 11548 }, { "epoch": 0.32, "learning_rate": 1.602385482790355e-05, "loss": 1.4414, "step": 11549 }, { "epoch": 0.32, "learning_rate": 1.602314878599383e-05, "loss": 1.2808, "step": 11550 }, { "epoch": 0.32, "learning_rate": 1.6022442696961822e-05, "loss": 1.4631, "step": 11551 }, { "epoch": 0.32, "learning_rate": 1.6021736560813055e-05, "loss": 1.3445, "step": 11552 }, { "epoch": 0.32, "learning_rate": 1.6021030377553054e-05, "loss": 1.3396, "step": 11553 }, { "epoch": 0.32, "learning_rate": 1.6020324147187342e-05, "loss": 1.2397, "step": 11554 }, { "epoch": 0.32, "learning_rate": 1.6019617869721444e-05, "loss": 1.4316, "step": 11555 }, { "epoch": 0.32, "learning_rate": 1.6018911545160888e-05, "loss": 1.355, "step": 11556 }, { "epoch": 0.32, "learning_rate": 1.6018205173511198e-05, "loss": 1.3121, "step": 11557 }, { "epoch": 0.32, "learning_rate": 1.6017498754777898e-05, "loss": 1.3005, "step": 11558 }, { "epoch": 0.32, "learning_rate": 1.6016792288966517e-05, "loss": 1.3103, "step": 11559 }, { "epoch": 0.32, "learning_rate": 1.6016085776082587e-05, "loss": 1.4465, "step": 11560 }, { "epoch": 0.32, "learning_rate": 1.601537921613163e-05, "loss": 1.4736, "step": 11561 }, { "epoch": 0.32, "learning_rate": 1.601467260911917e-05, "loss": 1.4692, "step": 11562 }, { "epoch": 0.32, "learning_rate": 1.6013965955050746e-05, "loss": 1.3052, "step": 11563 }, { "epoch": 0.32, "learning_rate": 1.6013259253931878e-05, "loss": 1.3005, "step": 11564 }, { "epoch": 0.32, "learning_rate": 1.6012552505768094e-05, "loss": 1.2903, "step": 11565 }, { "epoch": 0.32, "learning_rate": 1.601184571056493e-05, "loss": 1.2407, "step": 11566 }, { "epoch": 0.32, "learning_rate": 1.6011138868327912e-05, "loss": 1.3594, "step": 11567 }, { "epoch": 0.32, "learning_rate": 1.601043197906257e-05, "loss": 1.7446, "step": 11568 }, { "epoch": 0.32, "learning_rate": 1.6009725042774434e-05, "loss": 1.3682, "step": 11569 }, { "epoch": 0.32, "learning_rate": 1.6009018059469036e-05, "loss": 1.2961, "step": 11570 }, { "epoch": 0.32, "learning_rate": 1.6008311029151907e-05, "loss": 1.418, "step": 11571 }, { "epoch": 0.32, "learning_rate": 1.6007603951828576e-05, "loss": 1.301, "step": 11572 }, { "epoch": 0.32, "learning_rate": 1.6006896827504575e-05, "loss": 1.3992, "step": 11573 }, { "epoch": 0.32, "learning_rate": 1.600618965618544e-05, "loss": 1.1807, "step": 11574 }, { "epoch": 0.32, "learning_rate": 1.60054824378767e-05, "loss": 1.2734, "step": 11575 }, { "epoch": 0.32, "learning_rate": 1.6004775172583893e-05, "loss": 1.3982, "step": 11576 }, { "epoch": 0.32, "learning_rate": 1.6004067860312545e-05, "loss": 1.3835, "step": 11577 }, { "epoch": 0.32, "learning_rate": 1.6003360501068192e-05, "loss": 1.239, "step": 11578 }, { "epoch": 0.32, "learning_rate": 1.6002653094856374e-05, "loss": 1.2866, "step": 11579 }, { "epoch": 0.32, "learning_rate": 1.600194564168262e-05, "loss": 1.262, "step": 11580 }, { "epoch": 0.32, "learning_rate": 1.6001238141552466e-05, "loss": 1.4097, "step": 11581 }, { "epoch": 0.32, "learning_rate": 1.6000530594471442e-05, "loss": 1.3782, "step": 11582 }, { "epoch": 0.32, "learning_rate": 1.599982300044509e-05, "loss": 1.2988, "step": 11583 }, { "epoch": 0.32, "learning_rate": 1.5999115359478948e-05, "loss": 1.502, "step": 11584 }, { "epoch": 0.32, "learning_rate": 1.5998407671578548e-05, "loss": 1.1257, "step": 11585 }, { "epoch": 0.32, "learning_rate": 1.5997699936749425e-05, "loss": 1.2129, "step": 11586 }, { "epoch": 0.32, "learning_rate": 1.5996992154997117e-05, "loss": 1.4421, "step": 11587 }, { "epoch": 0.32, "learning_rate": 1.5996284326327165e-05, "loss": 1.3948, "step": 11588 }, { "epoch": 0.32, "learning_rate": 1.5995576450745104e-05, "loss": 1.2549, "step": 11589 }, { "epoch": 0.32, "learning_rate": 1.599486852825647e-05, "loss": 1.335, "step": 11590 }, { "epoch": 0.32, "learning_rate": 1.5994160558866803e-05, "loss": 1.2539, "step": 11591 }, { "epoch": 0.32, "learning_rate": 1.5993452542581646e-05, "loss": 1.1824, "step": 11592 }, { "epoch": 0.32, "learning_rate": 1.599274447940653e-05, "loss": 1.408, "step": 11593 }, { "epoch": 0.32, "learning_rate": 1.5992036369347003e-05, "loss": 1.5547, "step": 11594 }, { "epoch": 0.32, "learning_rate": 1.59913282124086e-05, "loss": 1.21, "step": 11595 }, { "epoch": 0.32, "learning_rate": 1.5990620008596863e-05, "loss": 1.3945, "step": 11596 }, { "epoch": 0.32, "learning_rate": 1.598991175791733e-05, "loss": 1.1992, "step": 11597 }, { "epoch": 0.32, "learning_rate": 1.5989203460375543e-05, "loss": 1.2839, "step": 11598 }, { "epoch": 0.32, "learning_rate": 1.5988495115977046e-05, "loss": 1.2778, "step": 11599 }, { "epoch": 0.32, "learning_rate": 1.5987786724727385e-05, "loss": 1.1895, "step": 11600 }, { "epoch": 0.32, "learning_rate": 1.5987078286632088e-05, "loss": 1.2888, "step": 11601 }, { "epoch": 0.32, "learning_rate": 1.598636980169671e-05, "loss": 1.4331, "step": 11602 }, { "epoch": 0.32, "learning_rate": 1.598566126992679e-05, "loss": 1.311, "step": 11603 }, { "epoch": 0.32, "learning_rate": 1.598495269132787e-05, "loss": 1.3411, "step": 11604 }, { "epoch": 0.32, "learning_rate": 1.5984244065905495e-05, "loss": 1.4036, "step": 11605 }, { "epoch": 0.32, "learning_rate": 1.5983535393665202e-05, "loss": 1.2766, "step": 11606 }, { "epoch": 0.32, "learning_rate": 1.598282667461255e-05, "loss": 1.1094, "step": 11607 }, { "epoch": 0.32, "learning_rate": 1.598211790875307e-05, "loss": 1.3403, "step": 11608 }, { "epoch": 0.32, "learning_rate": 1.5981409096092317e-05, "loss": 1.415, "step": 11609 }, { "epoch": 0.32, "learning_rate": 1.5980700236635833e-05, "loss": 1.728, "step": 11610 }, { "epoch": 0.32, "learning_rate": 1.5979991330389157e-05, "loss": 1.4207, "step": 11611 }, { "epoch": 0.32, "learning_rate": 1.5979282377357846e-05, "loss": 1.3884, "step": 11612 }, { "epoch": 0.32, "learning_rate": 1.5978573377547436e-05, "loss": 1.5259, "step": 11613 }, { "epoch": 0.32, "learning_rate": 1.5977864330963484e-05, "loss": 1.3757, "step": 11614 }, { "epoch": 0.32, "learning_rate": 1.597715523761153e-05, "loss": 1.4072, "step": 11615 }, { "epoch": 0.32, "learning_rate": 1.5976446097497125e-05, "loss": 1.3828, "step": 11616 }, { "epoch": 0.32, "learning_rate": 1.5975736910625818e-05, "loss": 1.3684, "step": 11617 }, { "epoch": 0.32, "learning_rate": 1.597502767700315e-05, "loss": 1.2446, "step": 11618 }, { "epoch": 0.32, "learning_rate": 1.597431839663468e-05, "loss": 1.3335, "step": 11619 }, { "epoch": 0.32, "learning_rate": 1.5973609069525952e-05, "loss": 1.3088, "step": 11620 }, { "epoch": 0.32, "learning_rate": 1.597289969568251e-05, "loss": 1.3706, "step": 11621 }, { "epoch": 0.32, "learning_rate": 1.5972190275109913e-05, "loss": 1.2952, "step": 11622 }, { "epoch": 0.32, "learning_rate": 1.597148080781371e-05, "loss": 1.3267, "step": 11623 }, { "epoch": 0.32, "learning_rate": 1.5970771293799446e-05, "loss": 1.4272, "step": 11624 }, { "epoch": 0.32, "learning_rate": 1.597006173307268e-05, "loss": 1.5205, "step": 11625 }, { "epoch": 0.32, "learning_rate": 1.596935212563895e-05, "loss": 1.4551, "step": 11626 }, { "epoch": 0.32, "learning_rate": 1.596864247150382e-05, "loss": 1.4724, "step": 11627 }, { "epoch": 0.32, "learning_rate": 1.596793277067284e-05, "loss": 1.793, "step": 11628 }, { "epoch": 0.32, "learning_rate": 1.596722302315156e-05, "loss": 1.3047, "step": 11629 }, { "epoch": 0.32, "learning_rate": 1.596651322894553e-05, "loss": 1.1946, "step": 11630 }, { "epoch": 0.32, "learning_rate": 1.596580338806031e-05, "loss": 1.3086, "step": 11631 }, { "epoch": 0.32, "learning_rate": 1.5965093500501446e-05, "loss": 1.4453, "step": 11632 }, { "epoch": 0.32, "learning_rate": 1.5964383566274498e-05, "loss": 1.1348, "step": 11633 }, { "epoch": 0.32, "learning_rate": 1.5963673585385016e-05, "loss": 1.3472, "step": 11634 }, { "epoch": 0.32, "learning_rate": 1.5962963557838557e-05, "loss": 1.5, "step": 11635 }, { "epoch": 0.32, "learning_rate": 1.5962253483640674e-05, "loss": 1.3433, "step": 11636 }, { "epoch": 0.32, "learning_rate": 1.5961543362796924e-05, "loss": 1.2969, "step": 11637 }, { "epoch": 0.32, "learning_rate": 1.5960833195312863e-05, "loss": 1.4297, "step": 11638 }, { "epoch": 0.32, "learning_rate": 1.5960122981194045e-05, "loss": 1.4082, "step": 11639 }, { "epoch": 0.32, "learning_rate": 1.595941272044603e-05, "loss": 1.2764, "step": 11640 }, { "epoch": 0.32, "learning_rate": 1.595870241307437e-05, "loss": 1.2151, "step": 11641 }, { "epoch": 0.32, "learning_rate": 1.5957992059084624e-05, "loss": 1.3708, "step": 11642 }, { "epoch": 0.32, "learning_rate": 1.5957281658482348e-05, "loss": 1.4751, "step": 11643 }, { "epoch": 0.32, "learning_rate": 1.5956571211273103e-05, "loss": 1.3948, "step": 11644 }, { "epoch": 0.32, "learning_rate": 1.5955860717462447e-05, "loss": 1.3313, "step": 11645 }, { "epoch": 0.32, "learning_rate": 1.5955150177055937e-05, "loss": 1.3313, "step": 11646 }, { "epoch": 0.32, "learning_rate": 1.5954439590059134e-05, "loss": 1.3198, "step": 11647 }, { "epoch": 0.32, "learning_rate": 1.5953728956477596e-05, "loss": 1.415, "step": 11648 }, { "epoch": 0.32, "learning_rate": 1.595301827631688e-05, "loss": 1.355, "step": 11649 }, { "epoch": 0.32, "learning_rate": 1.5952307549582548e-05, "loss": 1.4712, "step": 11650 }, { "epoch": 0.32, "learning_rate": 1.595159677628016e-05, "loss": 1.3958, "step": 11651 }, { "epoch": 0.32, "learning_rate": 1.5950885956415278e-05, "loss": 1.3525, "step": 11652 }, { "epoch": 0.32, "learning_rate": 1.5950175089993463e-05, "loss": 1.4646, "step": 11653 }, { "epoch": 0.32, "learning_rate": 1.5949464177020276e-05, "loss": 1.1035, "step": 11654 }, { "epoch": 0.32, "learning_rate": 1.594875321750128e-05, "loss": 1.3452, "step": 11655 }, { "epoch": 0.32, "learning_rate": 1.5948042211442035e-05, "loss": 1.4141, "step": 11656 }, { "epoch": 0.32, "learning_rate": 1.5947331158848104e-05, "loss": 1.3796, "step": 11657 }, { "epoch": 0.32, "learning_rate": 1.5946620059725054e-05, "loss": 1.3035, "step": 11658 }, { "epoch": 0.32, "learning_rate": 1.5945908914078442e-05, "loss": 1.4368, "step": 11659 }, { "epoch": 0.32, "learning_rate": 1.5945197721913834e-05, "loss": 1.4585, "step": 11660 }, { "epoch": 0.32, "learning_rate": 1.5944486483236797e-05, "loss": 1.3962, "step": 11661 }, { "epoch": 0.32, "learning_rate": 1.5943775198052894e-05, "loss": 1.446, "step": 11662 }, { "epoch": 0.32, "learning_rate": 1.5943063866367686e-05, "loss": 1.4282, "step": 11663 }, { "epoch": 0.32, "learning_rate": 1.594235248818674e-05, "loss": 1.2456, "step": 11664 }, { "epoch": 0.32, "learning_rate": 1.5941641063515625e-05, "loss": 1.13, "step": 11665 }, { "epoch": 0.32, "learning_rate": 1.5940929592359903e-05, "loss": 1.2537, "step": 11666 }, { "epoch": 0.32, "learning_rate": 1.594021807472514e-05, "loss": 1.3247, "step": 11667 }, { "epoch": 0.32, "learning_rate": 1.5939506510616907e-05, "loss": 1.3779, "step": 11668 }, { "epoch": 0.32, "learning_rate": 1.5938794900040768e-05, "loss": 1.3462, "step": 11669 }, { "epoch": 0.32, "learning_rate": 1.593808324300229e-05, "loss": 1.3091, "step": 11670 }, { "epoch": 0.32, "learning_rate": 1.593737153950704e-05, "loss": 1.2778, "step": 11671 }, { "epoch": 0.32, "learning_rate": 1.5936659789560587e-05, "loss": 1.3733, "step": 11672 }, { "epoch": 0.32, "learning_rate": 1.5935947993168502e-05, "loss": 1.1802, "step": 11673 }, { "epoch": 0.32, "learning_rate": 1.5935236150336345e-05, "loss": 1.3096, "step": 11674 }, { "epoch": 0.32, "learning_rate": 1.5934524261069697e-05, "loss": 1.2688, "step": 11675 }, { "epoch": 0.32, "learning_rate": 1.593381232537412e-05, "loss": 1.4111, "step": 11676 }, { "epoch": 0.32, "learning_rate": 1.5933100343255184e-05, "loss": 1.2407, "step": 11677 }, { "epoch": 0.32, "learning_rate": 1.5932388314718467e-05, "loss": 1.4346, "step": 11678 }, { "epoch": 0.32, "learning_rate": 1.5931676239769528e-05, "loss": 1.3721, "step": 11679 }, { "epoch": 0.32, "learning_rate": 1.5930964118413944e-05, "loss": 1.3574, "step": 11680 }, { "epoch": 0.32, "learning_rate": 1.5930251950657286e-05, "loss": 1.2937, "step": 11681 }, { "epoch": 0.32, "learning_rate": 1.5929539736505123e-05, "loss": 1.2739, "step": 11682 }, { "epoch": 0.32, "learning_rate": 1.5928827475963032e-05, "loss": 1.3525, "step": 11683 }, { "epoch": 0.32, "learning_rate": 1.5928115169036584e-05, "loss": 1.3281, "step": 11684 }, { "epoch": 0.32, "learning_rate": 1.5927402815731348e-05, "loss": 1.1829, "step": 11685 }, { "epoch": 0.32, "learning_rate": 1.5926690416052898e-05, "loss": 1.3442, "step": 11686 }, { "epoch": 0.32, "learning_rate": 1.5925977970006814e-05, "loss": 1.5125, "step": 11687 }, { "epoch": 0.32, "learning_rate": 1.5925265477598662e-05, "loss": 1.3096, "step": 11688 }, { "epoch": 0.32, "learning_rate": 1.5924552938834018e-05, "loss": 1.3833, "step": 11689 }, { "epoch": 0.32, "learning_rate": 1.5923840353718463e-05, "loss": 1.3672, "step": 11690 }, { "epoch": 0.32, "learning_rate": 1.5923127722257565e-05, "loss": 1.4346, "step": 11691 }, { "epoch": 0.32, "learning_rate": 1.5922415044456897e-05, "loss": 1.4541, "step": 11692 }, { "epoch": 0.32, "learning_rate": 1.5921702320322042e-05, "loss": 1.2625, "step": 11693 }, { "epoch": 0.32, "learning_rate": 1.592098954985857e-05, "loss": 1.4702, "step": 11694 }, { "epoch": 0.32, "learning_rate": 1.5920276733072062e-05, "loss": 1.0886, "step": 11695 }, { "epoch": 0.32, "learning_rate": 1.591956386996809e-05, "loss": 1.53, "step": 11696 }, { "epoch": 0.32, "learning_rate": 1.591885096055224e-05, "loss": 1.2224, "step": 11697 }, { "epoch": 0.32, "learning_rate": 1.5918138004830077e-05, "loss": 1.3359, "step": 11698 }, { "epoch": 0.32, "learning_rate": 1.591742500280719e-05, "loss": 1.4812, "step": 11699 }, { "epoch": 0.32, "learning_rate": 1.591671195448915e-05, "loss": 1.3967, "step": 11700 }, { "epoch": 0.32, "learning_rate": 1.5915998859881535e-05, "loss": 1.158, "step": 11701 }, { "epoch": 0.32, "learning_rate": 1.591528571898993e-05, "loss": 1.3496, "step": 11702 }, { "epoch": 0.32, "learning_rate": 1.591457253181991e-05, "loss": 1.3201, "step": 11703 }, { "epoch": 0.32, "learning_rate": 1.5913859298377054e-05, "loss": 1.3589, "step": 11704 }, { "epoch": 0.32, "learning_rate": 1.591314601866695e-05, "loss": 1.2017, "step": 11705 }, { "epoch": 0.32, "learning_rate": 1.5912432692695167e-05, "loss": 1.4094, "step": 11706 }, { "epoch": 0.32, "learning_rate": 1.5911719320467293e-05, "loss": 1.4863, "step": 11707 }, { "epoch": 0.32, "learning_rate": 1.5911005901988907e-05, "loss": 1.4841, "step": 11708 }, { "epoch": 0.32, "learning_rate": 1.5910292437265588e-05, "loss": 1.3643, "step": 11709 }, { "epoch": 0.32, "learning_rate": 1.590957892630292e-05, "loss": 1.3989, "step": 11710 }, { "epoch": 0.32, "learning_rate": 1.5908865369106486e-05, "loss": 1.3755, "step": 11711 }, { "epoch": 0.32, "learning_rate": 1.590815176568187e-05, "loss": 1.3159, "step": 11712 }, { "epoch": 0.32, "learning_rate": 1.5907438116034654e-05, "loss": 1.4092, "step": 11713 }, { "epoch": 0.32, "learning_rate": 1.5906724420170416e-05, "loss": 1.3206, "step": 11714 }, { "epoch": 0.32, "learning_rate": 1.5906010678094744e-05, "loss": 1.314, "step": 11715 }, { "epoch": 0.32, "learning_rate": 1.5905296889813225e-05, "loss": 1.3164, "step": 11716 }, { "epoch": 0.32, "learning_rate": 1.5904583055331438e-05, "loss": 1.4141, "step": 11717 }, { "epoch": 0.32, "learning_rate": 1.590386917465497e-05, "loss": 1.2449, "step": 11718 }, { "epoch": 0.32, "learning_rate": 1.5903155247789403e-05, "loss": 1.2439, "step": 11719 }, { "epoch": 0.32, "learning_rate": 1.590244127474033e-05, "loss": 1.29, "step": 11720 }, { "epoch": 0.32, "learning_rate": 1.5901727255513327e-05, "loss": 1.3311, "step": 11721 }, { "epoch": 0.32, "learning_rate": 1.5901013190113988e-05, "loss": 1.2095, "step": 11722 }, { "epoch": 0.32, "learning_rate": 1.5900299078547898e-05, "loss": 1.3745, "step": 11723 }, { "epoch": 0.32, "learning_rate": 1.5899584920820642e-05, "loss": 1.4375, "step": 11724 }, { "epoch": 0.32, "learning_rate": 1.5898870716937807e-05, "loss": 1.4351, "step": 11725 }, { "epoch": 0.32, "learning_rate": 1.589815646690498e-05, "loss": 1.363, "step": 11726 }, { "epoch": 0.32, "learning_rate": 1.5897442170727754e-05, "loss": 1.28, "step": 11727 }, { "epoch": 0.32, "learning_rate": 1.5896727828411707e-05, "loss": 1.2991, "step": 11728 }, { "epoch": 0.32, "learning_rate": 1.5896013439962442e-05, "loss": 1.4136, "step": 11729 }, { "epoch": 0.32, "learning_rate": 1.5895299005385534e-05, "loss": 1.4102, "step": 11730 }, { "epoch": 0.32, "learning_rate": 1.589458452468658e-05, "loss": 1.2196, "step": 11731 }, { "epoch": 0.32, "learning_rate": 1.589386999787117e-05, "loss": 1.2922, "step": 11732 }, { "epoch": 0.32, "learning_rate": 1.5893155424944896e-05, "loss": 1.415, "step": 11733 }, { "epoch": 0.32, "learning_rate": 1.589244080591334e-05, "loss": 1.3291, "step": 11734 }, { "epoch": 0.32, "learning_rate": 1.5891726140782097e-05, "loss": 1.2266, "step": 11735 }, { "epoch": 0.32, "learning_rate": 1.5891011429556765e-05, "loss": 1.4792, "step": 11736 }, { "epoch": 0.32, "learning_rate": 1.5890296672242926e-05, "loss": 1.5269, "step": 11737 }, { "epoch": 0.32, "learning_rate": 1.5889581868846176e-05, "loss": 1.2527, "step": 11738 }, { "epoch": 0.32, "learning_rate": 1.5888867019372107e-05, "loss": 1.4644, "step": 11739 }, { "epoch": 0.32, "learning_rate": 1.5888152123826314e-05, "loss": 1.3579, "step": 11740 }, { "epoch": 0.32, "learning_rate": 1.5887437182214386e-05, "loss": 1.2185, "step": 11741 }, { "epoch": 0.32, "learning_rate": 1.5886722194541914e-05, "loss": 1.3232, "step": 11742 }, { "epoch": 0.32, "learning_rate": 1.58860071608145e-05, "loss": 1.4795, "step": 11743 }, { "epoch": 0.32, "learning_rate": 1.5885292081037733e-05, "loss": 1.4258, "step": 11744 }, { "epoch": 0.32, "learning_rate": 1.588457695521721e-05, "loss": 1.3423, "step": 11745 }, { "epoch": 0.32, "learning_rate": 1.5883861783358518e-05, "loss": 1.1917, "step": 11746 }, { "epoch": 0.32, "learning_rate": 1.5883146565467262e-05, "loss": 1.2974, "step": 11747 }, { "epoch": 0.32, "learning_rate": 1.5882431301549032e-05, "loss": 1.2407, "step": 11748 }, { "epoch": 0.32, "learning_rate": 1.588171599160943e-05, "loss": 1.4802, "step": 11749 }, { "epoch": 0.32, "learning_rate": 1.5881000635654045e-05, "loss": 1.3789, "step": 11750 }, { "epoch": 0.32, "learning_rate": 1.5880285233688476e-05, "loss": 1.324, "step": 11751 }, { "epoch": 0.32, "learning_rate": 1.5879569785718324e-05, "loss": 1.3069, "step": 11752 }, { "epoch": 0.32, "learning_rate": 1.5878854291749178e-05, "loss": 1.3223, "step": 11753 }, { "epoch": 0.32, "learning_rate": 1.5878138751786644e-05, "loss": 1.2129, "step": 11754 }, { "epoch": 0.32, "learning_rate": 1.5877423165836313e-05, "loss": 1.377, "step": 11755 }, { "epoch": 0.32, "learning_rate": 1.587670753390379e-05, "loss": 1.2625, "step": 11756 }, { "epoch": 0.32, "learning_rate": 1.587599185599467e-05, "loss": 1.4219, "step": 11757 }, { "epoch": 0.32, "learning_rate": 1.5875276132114552e-05, "loss": 1.3784, "step": 11758 }, { "epoch": 0.32, "learning_rate": 1.5874560362269035e-05, "loss": 1.2842, "step": 11759 }, { "epoch": 0.32, "learning_rate": 1.5873844546463723e-05, "loss": 1.4583, "step": 11760 }, { "epoch": 0.32, "learning_rate": 1.5873128684704215e-05, "loss": 1.1863, "step": 11761 }, { "epoch": 0.32, "learning_rate": 1.5872412776996106e-05, "loss": 1.1152, "step": 11762 }, { "epoch": 0.32, "learning_rate": 1.5871696823344998e-05, "loss": 1.4077, "step": 11763 }, { "epoch": 0.32, "learning_rate": 1.5870980823756502e-05, "loss": 1.5142, "step": 11764 }, { "epoch": 0.32, "learning_rate": 1.5870264778236207e-05, "loss": 1.2449, "step": 11765 }, { "epoch": 0.32, "learning_rate": 1.5869548686789725e-05, "loss": 1.4146, "step": 11766 }, { "epoch": 0.32, "learning_rate": 1.5868832549422653e-05, "loss": 1.3838, "step": 11767 }, { "epoch": 0.32, "learning_rate": 1.5868116366140595e-05, "loss": 1.2998, "step": 11768 }, { "epoch": 0.32, "learning_rate": 1.5867400136949154e-05, "loss": 1.4148, "step": 11769 }, { "epoch": 0.32, "learning_rate": 1.5866683861853932e-05, "loss": 1.3464, "step": 11770 }, { "epoch": 0.32, "learning_rate": 1.5865967540860535e-05, "loss": 1.4353, "step": 11771 }, { "epoch": 0.32, "learning_rate": 1.5865251173974565e-05, "loss": 1.2686, "step": 11772 }, { "epoch": 0.32, "learning_rate": 1.5864534761201628e-05, "loss": 1.3975, "step": 11773 }, { "epoch": 0.32, "learning_rate": 1.5863818302547333e-05, "loss": 1.406, "step": 11774 }, { "epoch": 0.32, "learning_rate": 1.5863101798017275e-05, "loss": 1.3918, "step": 11775 }, { "epoch": 0.32, "learning_rate": 1.586238524761707e-05, "loss": 1.4009, "step": 11776 }, { "epoch": 0.32, "learning_rate": 1.5861668651352317e-05, "loss": 1.4434, "step": 11777 }, { "epoch": 0.32, "learning_rate": 1.5860952009228625e-05, "loss": 1.3384, "step": 11778 }, { "epoch": 0.32, "learning_rate": 1.58602353212516e-05, "loss": 1.3582, "step": 11779 }, { "epoch": 0.32, "learning_rate": 1.585951858742685e-05, "loss": 1.313, "step": 11780 }, { "epoch": 0.32, "learning_rate": 1.5858801807759984e-05, "loss": 1.3281, "step": 11781 }, { "epoch": 0.32, "learning_rate": 1.5858084982256607e-05, "loss": 1.3357, "step": 11782 }, { "epoch": 0.32, "learning_rate": 1.585736811092233e-05, "loss": 1.2886, "step": 11783 }, { "epoch": 0.32, "learning_rate": 1.5856651193762754e-05, "loss": 1.3376, "step": 11784 }, { "epoch": 0.32, "learning_rate": 1.5855934230783496e-05, "loss": 1.3633, "step": 11785 }, { "epoch": 0.32, "learning_rate": 1.585521722199016e-05, "loss": 1.2734, "step": 11786 }, { "epoch": 0.32, "learning_rate": 1.585450016738836e-05, "loss": 1.3396, "step": 11787 }, { "epoch": 0.32, "learning_rate": 1.5853783066983705e-05, "loss": 1.3179, "step": 11788 }, { "epoch": 0.32, "learning_rate": 1.5853065920781802e-05, "loss": 1.3667, "step": 11789 }, { "epoch": 0.32, "learning_rate": 1.585234872878826e-05, "loss": 1.3645, "step": 11790 }, { "epoch": 0.32, "learning_rate": 1.58516314910087e-05, "loss": 1.1921, "step": 11791 }, { "epoch": 0.32, "learning_rate": 1.5850914207448722e-05, "loss": 1.3376, "step": 11792 }, { "epoch": 0.32, "learning_rate": 1.5850196878113946e-05, "loss": 1.2515, "step": 11793 }, { "epoch": 0.32, "learning_rate": 1.5849479503009978e-05, "loss": 1.1472, "step": 11794 }, { "epoch": 0.32, "learning_rate": 1.5848762082142432e-05, "loss": 1.3047, "step": 11795 }, { "epoch": 0.32, "learning_rate": 1.5848044615516927e-05, "loss": 1.2754, "step": 11796 }, { "epoch": 0.32, "learning_rate": 1.5847327103139065e-05, "loss": 1.3972, "step": 11797 }, { "epoch": 0.32, "learning_rate": 1.584660954501447e-05, "loss": 1.3552, "step": 11798 }, { "epoch": 0.32, "learning_rate": 1.584589194114875e-05, "loss": 1.2893, "step": 11799 }, { "epoch": 0.32, "learning_rate": 1.5845174291547518e-05, "loss": 1.468, "step": 11800 }, { "epoch": 0.32, "learning_rate": 1.5844456596216392e-05, "loss": 1.3682, "step": 11801 }, { "epoch": 0.32, "learning_rate": 1.5843738855160987e-05, "loss": 1.4517, "step": 11802 }, { "epoch": 0.32, "learning_rate": 1.5843021068386914e-05, "loss": 1.3738, "step": 11803 }, { "epoch": 0.32, "learning_rate": 1.5842303235899798e-05, "loss": 1.5125, "step": 11804 }, { "epoch": 0.32, "learning_rate": 1.5841585357705242e-05, "loss": 1.3069, "step": 11805 }, { "epoch": 0.32, "learning_rate": 1.5840867433808872e-05, "loss": 1.2546, "step": 11806 }, { "epoch": 0.32, "learning_rate": 1.5840149464216303e-05, "loss": 1.3755, "step": 11807 }, { "epoch": 0.32, "learning_rate": 1.583943144893315e-05, "loss": 1.3213, "step": 11808 }, { "epoch": 0.32, "learning_rate": 1.5838713387965027e-05, "loss": 1.4658, "step": 11809 }, { "epoch": 0.32, "learning_rate": 1.583799528131756e-05, "loss": 1.2502, "step": 11810 }, { "epoch": 0.32, "learning_rate": 1.5837277128996364e-05, "loss": 1.231, "step": 11811 }, { "epoch": 0.32, "learning_rate": 1.5836558931007057e-05, "loss": 1.377, "step": 11812 }, { "epoch": 0.32, "learning_rate": 1.5835840687355254e-05, "loss": 1.3999, "step": 11813 }, { "epoch": 0.32, "learning_rate": 1.583512239804658e-05, "loss": 1.3047, "step": 11814 }, { "epoch": 0.32, "learning_rate": 1.583440406308665e-05, "loss": 1.4165, "step": 11815 }, { "epoch": 0.32, "learning_rate": 1.583368568248109e-05, "loss": 1.2709, "step": 11816 }, { "epoch": 0.32, "learning_rate": 1.5832967256235515e-05, "loss": 1.3716, "step": 11817 }, { "epoch": 0.32, "learning_rate": 1.5832248784355547e-05, "loss": 1.3555, "step": 11818 }, { "epoch": 0.32, "learning_rate": 1.5831530266846808e-05, "loss": 1.3342, "step": 11819 }, { "epoch": 0.32, "learning_rate": 1.5830811703714916e-05, "loss": 1.3955, "step": 11820 }, { "epoch": 0.32, "learning_rate": 1.5830093094965496e-05, "loss": 1.3823, "step": 11821 }, { "epoch": 0.32, "learning_rate": 1.5829374440604167e-05, "loss": 1.1157, "step": 11822 }, { "epoch": 0.32, "learning_rate": 1.582865574063656e-05, "loss": 1.2295, "step": 11823 }, { "epoch": 0.32, "learning_rate": 1.5827936995068285e-05, "loss": 1.4019, "step": 11824 }, { "epoch": 0.32, "learning_rate": 1.5827218203904973e-05, "loss": 1.2161, "step": 11825 }, { "epoch": 0.32, "learning_rate": 1.5826499367152247e-05, "loss": 1.4253, "step": 11826 }, { "epoch": 0.32, "learning_rate": 1.582578048481573e-05, "loss": 1.4321, "step": 11827 }, { "epoch": 0.32, "learning_rate": 1.582506155690104e-05, "loss": 1.4023, "step": 11828 }, { "epoch": 0.32, "learning_rate": 1.5824342583413816e-05, "loss": 1.3979, "step": 11829 }, { "epoch": 0.32, "learning_rate": 1.582362356435967e-05, "loss": 1.4253, "step": 11830 }, { "epoch": 0.32, "learning_rate": 1.5822904499744233e-05, "loss": 1.1628, "step": 11831 }, { "epoch": 0.32, "learning_rate": 1.5822185389573127e-05, "loss": 1.2405, "step": 11832 }, { "epoch": 0.32, "learning_rate": 1.5821466233851985e-05, "loss": 1.3833, "step": 11833 }, { "epoch": 0.32, "learning_rate": 1.5820747032586426e-05, "loss": 1.2532, "step": 11834 }, { "epoch": 0.32, "learning_rate": 1.582002778578208e-05, "loss": 1.3562, "step": 11835 }, { "epoch": 0.32, "learning_rate": 1.581930849344457e-05, "loss": 1.3062, "step": 11836 }, { "epoch": 0.32, "learning_rate": 1.581858915557953e-05, "loss": 1.2834, "step": 11837 }, { "epoch": 0.32, "learning_rate": 1.5817869772192584e-05, "loss": 1.3406, "step": 11838 }, { "epoch": 0.32, "learning_rate": 1.5817150343289363e-05, "loss": 1.3271, "step": 11839 }, { "epoch": 0.32, "learning_rate": 1.5816430868875486e-05, "loss": 1.2632, "step": 11840 }, { "epoch": 0.32, "learning_rate": 1.5815711348956593e-05, "loss": 1.3206, "step": 11841 }, { "epoch": 0.32, "learning_rate": 1.5814991783538313e-05, "loss": 1.4263, "step": 11842 }, { "epoch": 0.32, "learning_rate": 1.581427217262627e-05, "loss": 1.2817, "step": 11843 }, { "epoch": 0.32, "learning_rate": 1.5813552516226092e-05, "loss": 1.3079, "step": 11844 }, { "epoch": 0.32, "learning_rate": 1.5812832814343415e-05, "loss": 1.3557, "step": 11845 }, { "epoch": 0.32, "learning_rate": 1.5812113066983866e-05, "loss": 1.3853, "step": 11846 }, { "epoch": 0.32, "learning_rate": 1.581139327415308e-05, "loss": 1.1987, "step": 11847 }, { "epoch": 0.32, "learning_rate": 1.5810673435856684e-05, "loss": 1.2373, "step": 11848 }, { "epoch": 0.32, "learning_rate": 1.580995355210031e-05, "loss": 1.4194, "step": 11849 }, { "epoch": 0.32, "learning_rate": 1.5809233622889596e-05, "loss": 1.2778, "step": 11850 }, { "epoch": 0.32, "learning_rate": 1.580851364823017e-05, "loss": 1.2004, "step": 11851 }, { "epoch": 0.32, "learning_rate": 1.580779362812766e-05, "loss": 1.3699, "step": 11852 }, { "epoch": 0.32, "learning_rate": 1.5807073562587706e-05, "loss": 1.4824, "step": 11853 }, { "epoch": 0.32, "learning_rate": 1.5806353451615938e-05, "loss": 1.3865, "step": 11854 }, { "epoch": 0.32, "learning_rate": 1.580563329521799e-05, "loss": 1.4214, "step": 11855 }, { "epoch": 0.32, "learning_rate": 1.5804913093399498e-05, "loss": 1.4106, "step": 11856 }, { "epoch": 0.32, "learning_rate": 1.5804192846166095e-05, "loss": 1.3845, "step": 11857 }, { "epoch": 0.32, "learning_rate": 1.580347255352342e-05, "loss": 1.2678, "step": 11858 }, { "epoch": 0.32, "learning_rate": 1.58027522154771e-05, "loss": 1.2529, "step": 11859 }, { "epoch": 0.32, "learning_rate": 1.580203183203278e-05, "loss": 1.52, "step": 11860 }, { "epoch": 0.32, "learning_rate": 1.5801311403196086e-05, "loss": 1.3564, "step": 11861 }, { "epoch": 0.32, "learning_rate": 1.5800590928972663e-05, "loss": 1.4333, "step": 11862 }, { "epoch": 0.32, "learning_rate": 1.5799870409368146e-05, "loss": 1.2666, "step": 11863 }, { "epoch": 0.32, "learning_rate": 1.5799149844388168e-05, "loss": 1.3093, "step": 11864 }, { "epoch": 0.32, "learning_rate": 1.5798429234038368e-05, "loss": 1.4863, "step": 11865 }, { "epoch": 0.32, "learning_rate": 1.5797708578324384e-05, "loss": 1.2405, "step": 11866 }, { "epoch": 0.32, "learning_rate": 1.5796987877251856e-05, "loss": 1.688, "step": 11867 }, { "epoch": 0.32, "learning_rate": 1.579626713082642e-05, "loss": 1.7588, "step": 11868 }, { "epoch": 0.32, "learning_rate": 1.5795546339053717e-05, "loss": 1.5002, "step": 11869 }, { "epoch": 0.32, "learning_rate": 1.579482550193938e-05, "loss": 1.2976, "step": 11870 }, { "epoch": 0.32, "learning_rate": 1.5794104619489058e-05, "loss": 1.3367, "step": 11871 }, { "epoch": 0.32, "learning_rate": 1.5793383691708383e-05, "loss": 1.2822, "step": 11872 }, { "epoch": 0.32, "learning_rate": 1.5792662718603e-05, "loss": 1.3535, "step": 11873 }, { "epoch": 0.32, "learning_rate": 1.5791941700178548e-05, "loss": 1.2263, "step": 11874 }, { "epoch": 0.32, "learning_rate": 1.579122063644067e-05, "loss": 1.2656, "step": 11875 }, { "epoch": 0.32, "learning_rate": 1.5790499527395e-05, "loss": 1.3064, "step": 11876 }, { "epoch": 0.32, "learning_rate": 1.5789778373047187e-05, "loss": 1.4419, "step": 11877 }, { "epoch": 0.32, "learning_rate": 1.578905717340287e-05, "loss": 1.3105, "step": 11878 }, { "epoch": 0.32, "learning_rate": 1.5788335928467693e-05, "loss": 1.2229, "step": 11879 }, { "epoch": 0.32, "learning_rate": 1.5787614638247294e-05, "loss": 1.3179, "step": 11880 }, { "epoch": 0.32, "learning_rate": 1.5786893302747323e-05, "loss": 1.417, "step": 11881 }, { "epoch": 0.32, "learning_rate": 1.578617192197342e-05, "loss": 1.4043, "step": 11882 }, { "epoch": 0.32, "learning_rate": 1.578545049593123e-05, "loss": 1.4971, "step": 11883 }, { "epoch": 0.32, "learning_rate": 1.5784729024626393e-05, "loss": 1.3853, "step": 11884 }, { "epoch": 0.32, "learning_rate": 1.5784007508064557e-05, "loss": 1.3911, "step": 11885 }, { "epoch": 0.32, "learning_rate": 1.5783285946251365e-05, "loss": 1.4139, "step": 11886 }, { "epoch": 0.32, "learning_rate": 1.5782564339192465e-05, "loss": 1.3276, "step": 11887 }, { "epoch": 0.32, "learning_rate": 1.57818426868935e-05, "loss": 1.2358, "step": 11888 }, { "epoch": 0.32, "learning_rate": 1.5781120989360115e-05, "loss": 1.4761, "step": 11889 }, { "epoch": 0.32, "learning_rate": 1.5780399246597962e-05, "loss": 1.3994, "step": 11890 }, { "epoch": 0.32, "learning_rate": 1.5779677458612682e-05, "loss": 1.3645, "step": 11891 }, { "epoch": 0.32, "learning_rate": 1.577895562540992e-05, "loss": 1.377, "step": 11892 }, { "epoch": 0.32, "learning_rate": 1.577823374699533e-05, "loss": 1.4153, "step": 11893 }, { "epoch": 0.32, "learning_rate": 1.5777511823374557e-05, "loss": 1.2302, "step": 11894 }, { "epoch": 0.32, "learning_rate": 1.5776789854553246e-05, "loss": 1.292, "step": 11895 }, { "epoch": 0.32, "learning_rate": 1.5776067840537048e-05, "loss": 1.2683, "step": 11896 }, { "epoch": 0.32, "learning_rate": 1.577534578133161e-05, "loss": 1.1243, "step": 11897 }, { "epoch": 0.32, "learning_rate": 1.5774623676942588e-05, "loss": 1.3186, "step": 11898 }, { "epoch": 0.32, "learning_rate": 1.5773901527375623e-05, "loss": 1.2007, "step": 11899 }, { "epoch": 0.32, "learning_rate": 1.5773179332636363e-05, "loss": 1.291, "step": 11900 }, { "epoch": 0.33, "learning_rate": 1.5772457092730468e-05, "loss": 1.2333, "step": 11901 }, { "epoch": 0.33, "learning_rate": 1.5771734807663577e-05, "loss": 1.467, "step": 11902 }, { "epoch": 0.33, "learning_rate": 1.577101247744135e-05, "loss": 1.3123, "step": 11903 }, { "epoch": 0.33, "learning_rate": 1.577029010206944e-05, "loss": 1.3286, "step": 11904 }, { "epoch": 0.33, "learning_rate": 1.576956768155349e-05, "loss": 1.3518, "step": 11905 }, { "epoch": 0.33, "learning_rate": 1.5768845215899154e-05, "loss": 1.2585, "step": 11906 }, { "epoch": 0.33, "learning_rate": 1.5768122705112085e-05, "loss": 1.3865, "step": 11907 }, { "epoch": 0.33, "learning_rate": 1.576740014919794e-05, "loss": 1.3191, "step": 11908 }, { "epoch": 0.33, "learning_rate": 1.5766677548162366e-05, "loss": 1.3577, "step": 11909 }, { "epoch": 0.33, "learning_rate": 1.576595490201102e-05, "loss": 1.5054, "step": 11910 }, { "epoch": 0.33, "learning_rate": 1.5765232210749553e-05, "loss": 1.4849, "step": 11911 }, { "epoch": 0.33, "learning_rate": 1.576450947438362e-05, "loss": 1.386, "step": 11912 }, { "epoch": 0.33, "learning_rate": 1.5763786692918875e-05, "loss": 1.3489, "step": 11913 }, { "epoch": 0.33, "learning_rate": 1.5763063866360976e-05, "loss": 1.321, "step": 11914 }, { "epoch": 0.33, "learning_rate": 1.5762340994715574e-05, "loss": 1.3616, "step": 11915 }, { "epoch": 0.33, "learning_rate": 1.5761618077988323e-05, "loss": 1.4138, "step": 11916 }, { "epoch": 0.33, "learning_rate": 1.5760895116184887e-05, "loss": 1.3259, "step": 11917 }, { "epoch": 0.33, "learning_rate": 1.576017210931091e-05, "loss": 1.322, "step": 11918 }, { "epoch": 0.33, "learning_rate": 1.575944905737206e-05, "loss": 1.4019, "step": 11919 }, { "epoch": 0.33, "learning_rate": 1.5758725960373986e-05, "loss": 1.2966, "step": 11920 }, { "epoch": 0.33, "learning_rate": 1.5758002818322348e-05, "loss": 1.2764, "step": 11921 }, { "epoch": 0.33, "learning_rate": 1.5757279631222805e-05, "loss": 1.4683, "step": 11922 }, { "epoch": 0.33, "learning_rate": 1.5756556399081014e-05, "loss": 1.4629, "step": 11923 }, { "epoch": 0.33, "learning_rate": 1.575583312190263e-05, "loss": 1.2803, "step": 11924 }, { "epoch": 0.33, "learning_rate": 1.5755109799693318e-05, "loss": 1.4333, "step": 11925 }, { "epoch": 0.33, "learning_rate": 1.575438643245873e-05, "loss": 1.3701, "step": 11926 }, { "epoch": 0.33, "learning_rate": 1.575366302020453e-05, "loss": 1.4482, "step": 11927 }, { "epoch": 0.33, "learning_rate": 1.5752939562936375e-05, "loss": 1.3696, "step": 11928 }, { "epoch": 0.33, "learning_rate": 1.5752216060659928e-05, "loss": 1.2817, "step": 11929 }, { "epoch": 0.33, "learning_rate": 1.5751492513380846e-05, "loss": 1.3193, "step": 11930 }, { "epoch": 0.33, "learning_rate": 1.575076892110479e-05, "loss": 1.3489, "step": 11931 }, { "epoch": 0.33, "learning_rate": 1.5750045283837427e-05, "loss": 1.2771, "step": 11932 }, { "epoch": 0.33, "learning_rate": 1.5749321601584408e-05, "loss": 1.3367, "step": 11933 }, { "epoch": 0.33, "learning_rate": 1.5748597874351402e-05, "loss": 1.2593, "step": 11934 }, { "epoch": 0.33, "learning_rate": 1.5747874102144073e-05, "loss": 1.2944, "step": 11935 }, { "epoch": 0.33, "learning_rate": 1.5747150284968074e-05, "loss": 1.1493, "step": 11936 }, { "epoch": 0.33, "learning_rate": 1.5746426422829076e-05, "loss": 1.2649, "step": 11937 }, { "epoch": 0.33, "learning_rate": 1.574570251573274e-05, "loss": 1.3796, "step": 11938 }, { "epoch": 0.33, "learning_rate": 1.5744978563684728e-05, "loss": 1.2688, "step": 11939 }, { "epoch": 0.33, "learning_rate": 1.574425456669071e-05, "loss": 1.2761, "step": 11940 }, { "epoch": 0.33, "learning_rate": 1.574353052475634e-05, "loss": 1.3965, "step": 11941 }, { "epoch": 0.33, "learning_rate": 1.574280643788729e-05, "loss": 1.3245, "step": 11942 }, { "epoch": 0.33, "learning_rate": 1.5742082306089223e-05, "loss": 1.2234, "step": 11943 }, { "epoch": 0.33, "learning_rate": 1.5741358129367806e-05, "loss": 1.4812, "step": 11944 }, { "epoch": 0.33, "learning_rate": 1.57406339077287e-05, "loss": 1.3389, "step": 11945 }, { "epoch": 0.33, "learning_rate": 1.5739909641177574e-05, "loss": 1.4644, "step": 11946 }, { "epoch": 0.33, "learning_rate": 1.5739185329720096e-05, "loss": 1.3931, "step": 11947 }, { "epoch": 0.33, "learning_rate": 1.573846097336193e-05, "loss": 1.4165, "step": 11948 }, { "epoch": 0.33, "learning_rate": 1.573773657210874e-05, "loss": 1.2881, "step": 11949 }, { "epoch": 0.33, "learning_rate": 1.57370121259662e-05, "loss": 1.1895, "step": 11950 }, { "epoch": 0.33, "learning_rate": 1.5736287634939978e-05, "loss": 1.2205, "step": 11951 }, { "epoch": 0.33, "learning_rate": 1.5735563099035737e-05, "loss": 1.3704, "step": 11952 }, { "epoch": 0.33, "learning_rate": 1.5734838518259143e-05, "loss": 1.2014, "step": 11953 }, { "epoch": 0.33, "learning_rate": 1.5734113892615874e-05, "loss": 1.3076, "step": 11954 }, { "epoch": 0.33, "learning_rate": 1.5733389222111592e-05, "loss": 1.394, "step": 11955 }, { "epoch": 0.33, "learning_rate": 1.573266450675197e-05, "loss": 1.3979, "step": 11956 }, { "epoch": 0.33, "learning_rate": 1.5731939746542677e-05, "loss": 1.3306, "step": 11957 }, { "epoch": 0.33, "learning_rate": 1.5731214941489384e-05, "loss": 1.3958, "step": 11958 }, { "epoch": 0.33, "learning_rate": 1.5730490091597757e-05, "loss": 1.4419, "step": 11959 }, { "epoch": 0.33, "learning_rate": 1.5729765196873473e-05, "loss": 1.4197, "step": 11960 }, { "epoch": 0.33, "learning_rate": 1.57290402573222e-05, "loss": 1.3418, "step": 11961 }, { "epoch": 0.33, "learning_rate": 1.5728315272949605e-05, "loss": 1.4543, "step": 11962 }, { "epoch": 0.33, "learning_rate": 1.5727590243761372e-05, "loss": 1.2751, "step": 11963 }, { "epoch": 0.33, "learning_rate": 1.572686516976316e-05, "loss": 1.22, "step": 11964 }, { "epoch": 0.33, "learning_rate": 1.572614005096065e-05, "loss": 1.3555, "step": 11965 }, { "epoch": 0.33, "learning_rate": 1.5725414887359517e-05, "loss": 1.2769, "step": 11966 }, { "epoch": 0.33, "learning_rate": 1.5724689678965427e-05, "loss": 1.408, "step": 11967 }, { "epoch": 0.33, "learning_rate": 1.5723964425784054e-05, "loss": 1.2795, "step": 11968 }, { "epoch": 0.33, "learning_rate": 1.572323912782108e-05, "loss": 1.2898, "step": 11969 }, { "epoch": 0.33, "learning_rate": 1.5722513785082173e-05, "loss": 1.3433, "step": 11970 }, { "epoch": 0.33, "learning_rate": 1.572178839757301e-05, "loss": 1.3904, "step": 11971 }, { "epoch": 0.33, "learning_rate": 1.5721062965299262e-05, "loss": 1.2383, "step": 11972 }, { "epoch": 0.33, "learning_rate": 1.5720337488266607e-05, "loss": 1.4644, "step": 11973 }, { "epoch": 0.33, "learning_rate": 1.5719611966480725e-05, "loss": 1.3677, "step": 11974 }, { "epoch": 0.33, "learning_rate": 1.5718886399947285e-05, "loss": 1.4302, "step": 11975 }, { "epoch": 0.33, "learning_rate": 1.571816078867197e-05, "loss": 1.3601, "step": 11976 }, { "epoch": 0.33, "learning_rate": 1.5717435132660456e-05, "loss": 1.4048, "step": 11977 }, { "epoch": 0.33, "learning_rate": 1.5716709431918413e-05, "loss": 0.994, "step": 11978 }, { "epoch": 0.33, "learning_rate": 1.5715983686451526e-05, "loss": 1.8638, "step": 11979 }, { "epoch": 0.33, "learning_rate": 1.5715257896265468e-05, "loss": 1.2847, "step": 11980 }, { "epoch": 0.33, "learning_rate": 1.5714532061365922e-05, "loss": 1.4185, "step": 11981 }, { "epoch": 0.33, "learning_rate": 1.5713806181758564e-05, "loss": 1.3269, "step": 11982 }, { "epoch": 0.33, "learning_rate": 1.5713080257449073e-05, "loss": 1.4238, "step": 11983 }, { "epoch": 0.33, "learning_rate": 1.5712354288443128e-05, "loss": 1.4111, "step": 11984 }, { "epoch": 0.33, "learning_rate": 1.5711628274746413e-05, "loss": 1.2517, "step": 11985 }, { "epoch": 0.33, "learning_rate": 1.57109022163646e-05, "loss": 1.3289, "step": 11986 }, { "epoch": 0.33, "learning_rate": 1.5710176113303374e-05, "loss": 1.3657, "step": 11987 }, { "epoch": 0.33, "learning_rate": 1.5709449965568415e-05, "loss": 1.2812, "step": 11988 }, { "epoch": 0.33, "learning_rate": 1.5708723773165403e-05, "loss": 1.4612, "step": 11989 }, { "epoch": 0.33, "learning_rate": 1.5707997536100025e-05, "loss": 1.4238, "step": 11990 }, { "epoch": 0.33, "learning_rate": 1.5707271254377955e-05, "loss": 1.4377, "step": 11991 }, { "epoch": 0.33, "learning_rate": 1.5706544928004882e-05, "loss": 1.3145, "step": 11992 }, { "epoch": 0.33, "learning_rate": 1.570581855698648e-05, "loss": 1.4961, "step": 11993 }, { "epoch": 0.33, "learning_rate": 1.570509214132844e-05, "loss": 1.4231, "step": 11994 }, { "epoch": 0.33, "learning_rate": 1.570436568103644e-05, "loss": 1.3911, "step": 11995 }, { "epoch": 0.33, "learning_rate": 1.5703639176116164e-05, "loss": 1.3687, "step": 11996 }, { "epoch": 0.33, "learning_rate": 1.57029126265733e-05, "loss": 1.4839, "step": 11997 }, { "epoch": 0.33, "learning_rate": 1.570218603241353e-05, "loss": 1.4695, "step": 11998 }, { "epoch": 0.33, "learning_rate": 1.5701459393642536e-05, "loss": 1.3167, "step": 11999 }, { "epoch": 0.33, "learning_rate": 1.5700732710266008e-05, "loss": 1.4236, "step": 12000 }, { "epoch": 0.33, "learning_rate": 1.5700005982289624e-05, "loss": 1.3879, "step": 12001 }, { "epoch": 0.33, "learning_rate": 1.5699279209719073e-05, "loss": 1.3237, "step": 12002 }, { "epoch": 0.33, "learning_rate": 1.5698552392560046e-05, "loss": 1.3203, "step": 12003 }, { "epoch": 0.33, "learning_rate": 1.569782553081822e-05, "loss": 1.334, "step": 12004 }, { "epoch": 0.33, "learning_rate": 1.569709862449929e-05, "loss": 1.4373, "step": 12005 }, { "epoch": 0.33, "learning_rate": 1.5696371673608933e-05, "loss": 1.3218, "step": 12006 }, { "epoch": 0.33, "learning_rate": 1.569564467815285e-05, "loss": 1.3242, "step": 12007 }, { "epoch": 0.33, "learning_rate": 1.5694917638136717e-05, "loss": 1.436, "step": 12008 }, { "epoch": 0.33, "learning_rate": 1.569419055356623e-05, "loss": 1.429, "step": 12009 }, { "epoch": 0.33, "learning_rate": 1.569346342444707e-05, "loss": 1.3672, "step": 12010 }, { "epoch": 0.33, "learning_rate": 1.569273625078493e-05, "loss": 1.3794, "step": 12011 }, { "epoch": 0.33, "learning_rate": 1.56920090325855e-05, "loss": 1.4683, "step": 12012 }, { "epoch": 0.33, "learning_rate": 1.5691281769854468e-05, "loss": 1.4019, "step": 12013 }, { "epoch": 0.33, "learning_rate": 1.5690554462597523e-05, "loss": 1.2571, "step": 12014 }, { "epoch": 0.33, "learning_rate": 1.5689827110820357e-05, "loss": 1.4746, "step": 12015 }, { "epoch": 0.33, "learning_rate": 1.5689099714528655e-05, "loss": 1.3325, "step": 12016 }, { "epoch": 0.33, "learning_rate": 1.5688372273728116e-05, "loss": 1.2654, "step": 12017 }, { "epoch": 0.33, "learning_rate": 1.5687644788424426e-05, "loss": 1.301, "step": 12018 }, { "epoch": 0.33, "learning_rate": 1.568691725862328e-05, "loss": 1.4575, "step": 12019 }, { "epoch": 0.33, "learning_rate": 1.5686189684330365e-05, "loss": 1.2566, "step": 12020 }, { "epoch": 0.33, "learning_rate": 1.5685462065551375e-05, "loss": 1.4014, "step": 12021 }, { "epoch": 0.33, "learning_rate": 1.5684734402292005e-05, "loss": 1.2153, "step": 12022 }, { "epoch": 0.33, "learning_rate": 1.5684006694557944e-05, "loss": 1.3513, "step": 12023 }, { "epoch": 0.33, "learning_rate": 1.568327894235489e-05, "loss": 1.4263, "step": 12024 }, { "epoch": 0.33, "learning_rate": 1.5682551145688532e-05, "loss": 1.3386, "step": 12025 }, { "epoch": 0.33, "learning_rate": 1.5681823304564566e-05, "loss": 1.3184, "step": 12026 }, { "epoch": 0.33, "learning_rate": 1.568109541898869e-05, "loss": 1.4119, "step": 12027 }, { "epoch": 0.33, "learning_rate": 1.5680367488966594e-05, "loss": 1.2957, "step": 12028 }, { "epoch": 0.33, "learning_rate": 1.567963951450397e-05, "loss": 1.3904, "step": 12029 }, { "epoch": 0.33, "learning_rate": 1.567891149560652e-05, "loss": 1.2771, "step": 12030 }, { "epoch": 0.33, "learning_rate": 1.5678183432279936e-05, "loss": 1.3386, "step": 12031 }, { "epoch": 0.33, "learning_rate": 1.5677455324529917e-05, "loss": 1.3535, "step": 12032 }, { "epoch": 0.33, "learning_rate": 1.5676727172362154e-05, "loss": 1.333, "step": 12033 }, { "epoch": 0.33, "learning_rate": 1.5675998975782346e-05, "loss": 1.3413, "step": 12034 }, { "epoch": 0.33, "learning_rate": 1.5675270734796196e-05, "loss": 1.2708, "step": 12035 }, { "epoch": 0.33, "learning_rate": 1.5674542449409392e-05, "loss": 1.2993, "step": 12036 }, { "epoch": 0.33, "learning_rate": 1.5673814119627636e-05, "loss": 1.3555, "step": 12037 }, { "epoch": 0.33, "learning_rate": 1.567308574545663e-05, "loss": 1.2966, "step": 12038 }, { "epoch": 0.33, "learning_rate": 1.567235732690207e-05, "loss": 1.2358, "step": 12039 }, { "epoch": 0.33, "learning_rate": 1.567162886396965e-05, "loss": 1.3037, "step": 12040 }, { "epoch": 0.33, "learning_rate": 1.5670900356665072e-05, "loss": 1.3308, "step": 12041 }, { "epoch": 0.33, "learning_rate": 1.567017180499404e-05, "loss": 1.3704, "step": 12042 }, { "epoch": 0.33, "learning_rate": 1.5669443208962246e-05, "loss": 1.3809, "step": 12043 }, { "epoch": 0.33, "learning_rate": 1.5668714568575395e-05, "loss": 1.2673, "step": 12044 }, { "epoch": 0.33, "learning_rate": 1.566798588383919e-05, "loss": 1.3477, "step": 12045 }, { "epoch": 0.33, "learning_rate": 1.5667257154759327e-05, "loss": 1.3118, "step": 12046 }, { "epoch": 0.33, "learning_rate": 1.5666528381341507e-05, "loss": 1.3557, "step": 12047 }, { "epoch": 0.33, "learning_rate": 1.5665799563591436e-05, "loss": 1.4153, "step": 12048 }, { "epoch": 0.33, "learning_rate": 1.5665070701514813e-05, "loss": 1.1318, "step": 12049 }, { "epoch": 0.33, "learning_rate": 1.5664341795117343e-05, "loss": 1.2502, "step": 12050 }, { "epoch": 0.33, "learning_rate": 1.5663612844404722e-05, "loss": 1.3574, "step": 12051 }, { "epoch": 0.33, "learning_rate": 1.566288384938266e-05, "loss": 1.3142, "step": 12052 }, { "epoch": 0.33, "learning_rate": 1.5662154810056857e-05, "loss": 1.4326, "step": 12053 }, { "epoch": 0.33, "learning_rate": 1.5661425726433013e-05, "loss": 1.4199, "step": 12054 }, { "epoch": 0.33, "learning_rate": 1.566069659851684e-05, "loss": 1.2236, "step": 12055 }, { "epoch": 0.33, "learning_rate": 1.5659967426314043e-05, "loss": 1.3279, "step": 12056 }, { "epoch": 0.33, "learning_rate": 1.5659238209830317e-05, "loss": 1.4209, "step": 12057 }, { "epoch": 0.33, "learning_rate": 1.5658508949071372e-05, "loss": 1.3848, "step": 12058 }, { "epoch": 0.33, "learning_rate": 1.5657779644042918e-05, "loss": 1.2302, "step": 12059 }, { "epoch": 0.33, "learning_rate": 1.5657050294750653e-05, "loss": 1.2565, "step": 12060 }, { "epoch": 0.33, "learning_rate": 1.5656320901200287e-05, "loss": 1.355, "step": 12061 }, { "epoch": 0.33, "learning_rate": 1.5655591463397528e-05, "loss": 1.4126, "step": 12062 }, { "epoch": 0.33, "learning_rate": 1.5654861981348078e-05, "loss": 1.3501, "step": 12063 }, { "epoch": 0.33, "learning_rate": 1.565413245505765e-05, "loss": 1.4365, "step": 12064 }, { "epoch": 0.33, "learning_rate": 1.5653402884531947e-05, "loss": 1.3411, "step": 12065 }, { "epoch": 0.33, "learning_rate": 1.5652673269776676e-05, "loss": 1.4268, "step": 12066 }, { "epoch": 0.33, "learning_rate": 1.565194361079755e-05, "loss": 1.3062, "step": 12067 }, { "epoch": 0.33, "learning_rate": 1.5651213907600274e-05, "loss": 1.3708, "step": 12068 }, { "epoch": 0.33, "learning_rate": 1.565048416019056e-05, "loss": 1.3149, "step": 12069 }, { "epoch": 0.33, "learning_rate": 1.5649754368574117e-05, "loss": 1.3101, "step": 12070 }, { "epoch": 0.33, "learning_rate": 1.5649024532756647e-05, "loss": 1.2942, "step": 12071 }, { "epoch": 0.33, "learning_rate": 1.5648294652743868e-05, "loss": 1.1468, "step": 12072 }, { "epoch": 0.33, "learning_rate": 1.5647564728541485e-05, "loss": 1.3264, "step": 12073 }, { "epoch": 0.33, "learning_rate": 1.5646834760155214e-05, "loss": 1.4163, "step": 12074 }, { "epoch": 0.33, "learning_rate": 1.564610474759076e-05, "loss": 1.3577, "step": 12075 }, { "epoch": 0.33, "learning_rate": 1.564537469085384e-05, "loss": 1.521, "step": 12076 }, { "epoch": 0.33, "learning_rate": 1.5644644589950163e-05, "loss": 1.291, "step": 12077 }, { "epoch": 0.33, "learning_rate": 1.564391444488544e-05, "loss": 1.4509, "step": 12078 }, { "epoch": 0.33, "learning_rate": 1.5643184255665388e-05, "loss": 1.2244, "step": 12079 }, { "epoch": 0.33, "learning_rate": 1.5642454022295712e-05, "loss": 1.156, "step": 12080 }, { "epoch": 0.33, "learning_rate": 1.564172374478213e-05, "loss": 1.2051, "step": 12081 }, { "epoch": 0.33, "learning_rate": 1.5640993423130354e-05, "loss": 1.3354, "step": 12082 }, { "epoch": 0.33, "learning_rate": 1.5640263057346098e-05, "loss": 1.7837, "step": 12083 }, { "epoch": 0.33, "learning_rate": 1.5639532647435077e-05, "loss": 1.3325, "step": 12084 }, { "epoch": 0.33, "learning_rate": 1.5638802193403008e-05, "loss": 1.3284, "step": 12085 }, { "epoch": 0.33, "learning_rate": 1.5638071695255596e-05, "loss": 1.2659, "step": 12086 }, { "epoch": 0.33, "learning_rate": 1.5637341152998568e-05, "loss": 1.4695, "step": 12087 }, { "epoch": 0.33, "learning_rate": 1.5636610566637628e-05, "loss": 1.2512, "step": 12088 }, { "epoch": 0.33, "learning_rate": 1.56358799361785e-05, "loss": 1.2437, "step": 12089 }, { "epoch": 0.33, "learning_rate": 1.5635149261626898e-05, "loss": 1.2378, "step": 12090 }, { "epoch": 0.33, "learning_rate": 1.5634418542988536e-05, "loss": 1.2957, "step": 12091 }, { "epoch": 0.33, "learning_rate": 1.5633687780269133e-05, "loss": 1.4609, "step": 12092 }, { "epoch": 0.33, "learning_rate": 1.5632956973474408e-05, "loss": 1.2974, "step": 12093 }, { "epoch": 0.33, "learning_rate": 1.5632226122610076e-05, "loss": 1.2048, "step": 12094 }, { "epoch": 0.33, "learning_rate": 1.5631495227681854e-05, "loss": 1.3423, "step": 12095 }, { "epoch": 0.33, "learning_rate": 1.5630764288695464e-05, "loss": 1.3521, "step": 12096 }, { "epoch": 0.33, "learning_rate": 1.5630033305656618e-05, "loss": 1.2122, "step": 12097 }, { "epoch": 0.33, "learning_rate": 1.5629302278571042e-05, "loss": 1.3574, "step": 12098 }, { "epoch": 0.33, "learning_rate": 1.5628571207444453e-05, "loss": 1.1807, "step": 12099 }, { "epoch": 0.33, "learning_rate": 1.562784009228257e-05, "loss": 1.2554, "step": 12100 }, { "epoch": 0.33, "learning_rate": 1.5627108933091105e-05, "loss": 1.3203, "step": 12101 }, { "epoch": 0.33, "learning_rate": 1.5626377729875792e-05, "loss": 1.459, "step": 12102 }, { "epoch": 0.33, "learning_rate": 1.5625646482642346e-05, "loss": 1.4546, "step": 12103 }, { "epoch": 0.33, "learning_rate": 1.5624915191396484e-05, "loss": 1.3113, "step": 12104 }, { "epoch": 0.33, "learning_rate": 1.562418385614393e-05, "loss": 1.3894, "step": 12105 }, { "epoch": 0.33, "learning_rate": 1.562345247689041e-05, "loss": 1.2424, "step": 12106 }, { "epoch": 0.33, "learning_rate": 1.562272105364164e-05, "loss": 1.2241, "step": 12107 }, { "epoch": 0.33, "learning_rate": 1.5621989586403346e-05, "loss": 1.4487, "step": 12108 }, { "epoch": 0.33, "learning_rate": 1.5621258075181246e-05, "loss": 1.3447, "step": 12109 }, { "epoch": 0.33, "learning_rate": 1.562052651998107e-05, "loss": 1.2856, "step": 12110 }, { "epoch": 0.33, "learning_rate": 1.5619794920808534e-05, "loss": 1.499, "step": 12111 }, { "epoch": 0.33, "learning_rate": 1.561906327766937e-05, "loss": 1.2061, "step": 12112 }, { "epoch": 0.33, "learning_rate": 1.561833159056929e-05, "loss": 1.3093, "step": 12113 }, { "epoch": 0.33, "learning_rate": 1.5617599859514034e-05, "loss": 1.3862, "step": 12114 }, { "epoch": 0.33, "learning_rate": 1.5616868084509313e-05, "loss": 1.2988, "step": 12115 }, { "epoch": 0.33, "learning_rate": 1.5616136265560858e-05, "loss": 1.1519, "step": 12116 }, { "epoch": 0.33, "learning_rate": 1.5615404402674395e-05, "loss": 1.1978, "step": 12117 }, { "epoch": 0.33, "learning_rate": 1.5614672495855647e-05, "loss": 1.4001, "step": 12118 }, { "epoch": 0.33, "learning_rate": 1.561394054511034e-05, "loss": 1.3652, "step": 12119 }, { "epoch": 0.33, "learning_rate": 1.5613208550444205e-05, "loss": 1.439, "step": 12120 }, { "epoch": 0.33, "learning_rate": 1.5612476511862963e-05, "loss": 1.3813, "step": 12121 }, { "epoch": 0.33, "learning_rate": 1.5611744429372346e-05, "loss": 1.1807, "step": 12122 }, { "epoch": 0.33, "learning_rate": 1.5611012302978077e-05, "loss": 1.1956, "step": 12123 }, { "epoch": 0.33, "learning_rate": 1.5610280132685892e-05, "loss": 1.4854, "step": 12124 }, { "epoch": 0.33, "learning_rate": 1.560954791850151e-05, "loss": 1.3572, "step": 12125 }, { "epoch": 0.33, "learning_rate": 1.5608815660430664e-05, "loss": 1.3696, "step": 12126 }, { "epoch": 0.33, "learning_rate": 1.560808335847908e-05, "loss": 1.333, "step": 12127 }, { "epoch": 0.33, "learning_rate": 1.560735101265249e-05, "loss": 1.2207, "step": 12128 }, { "epoch": 0.33, "learning_rate": 1.5606618622956622e-05, "loss": 1.1892, "step": 12129 }, { "epoch": 0.33, "learning_rate": 1.5605886189397205e-05, "loss": 1.323, "step": 12130 }, { "epoch": 0.33, "learning_rate": 1.560515371197997e-05, "loss": 1.3633, "step": 12131 }, { "epoch": 0.33, "learning_rate": 1.5604421190710654e-05, "loss": 1.4167, "step": 12132 }, { "epoch": 0.33, "learning_rate": 1.5603688625594975e-05, "loss": 1.2766, "step": 12133 }, { "epoch": 0.33, "learning_rate": 1.5602956016638674e-05, "loss": 1.2832, "step": 12134 }, { "epoch": 0.33, "learning_rate": 1.560222336384748e-05, "loss": 1.4941, "step": 12135 }, { "epoch": 0.33, "learning_rate": 1.5601490667227123e-05, "loss": 1.261, "step": 12136 }, { "epoch": 0.33, "learning_rate": 1.560075792678334e-05, "loss": 1.7568, "step": 12137 }, { "epoch": 0.33, "learning_rate": 1.560002514252186e-05, "loss": 1.385, "step": 12138 }, { "epoch": 0.33, "learning_rate": 1.5599292314448415e-05, "loss": 1.4395, "step": 12139 }, { "epoch": 0.33, "learning_rate": 1.559855944256874e-05, "loss": 1.2214, "step": 12140 }, { "epoch": 0.33, "learning_rate": 1.559782652688857e-05, "loss": 1.3494, "step": 12141 }, { "epoch": 0.33, "learning_rate": 1.5597093567413637e-05, "loss": 1.3513, "step": 12142 }, { "epoch": 0.33, "learning_rate": 1.559636056414968e-05, "loss": 1.2556, "step": 12143 }, { "epoch": 0.33, "learning_rate": 1.559562751710242e-05, "loss": 1.2683, "step": 12144 }, { "epoch": 0.33, "learning_rate": 1.559489442627761e-05, "loss": 1.2556, "step": 12145 }, { "epoch": 0.33, "learning_rate": 1.5594161291680973e-05, "loss": 1.3877, "step": 12146 }, { "epoch": 0.33, "learning_rate": 1.559342811331825e-05, "loss": 1.5098, "step": 12147 }, { "epoch": 0.33, "learning_rate": 1.5592694891195176e-05, "loss": 1.1741, "step": 12148 }, { "epoch": 0.33, "learning_rate": 1.559196162531748e-05, "loss": 1.4185, "step": 12149 }, { "epoch": 0.33, "learning_rate": 1.5591228315690915e-05, "loss": 1.1814, "step": 12150 }, { "epoch": 0.33, "learning_rate": 1.5590494962321202e-05, "loss": 1.1223, "step": 12151 }, { "epoch": 0.33, "learning_rate": 1.5589761565214092e-05, "loss": 1.282, "step": 12152 }, { "epoch": 0.33, "learning_rate": 1.5589028124375312e-05, "loss": 1.2988, "step": 12153 }, { "epoch": 0.33, "learning_rate": 1.5588294639810607e-05, "loss": 1.209, "step": 12154 }, { "epoch": 0.33, "learning_rate": 1.5587561111525707e-05, "loss": 1.2498, "step": 12155 }, { "epoch": 0.33, "learning_rate": 1.5586827539526362e-05, "loss": 1.3115, "step": 12156 }, { "epoch": 0.33, "learning_rate": 1.5586093923818304e-05, "loss": 1.2979, "step": 12157 }, { "epoch": 0.33, "learning_rate": 1.5585360264407273e-05, "loss": 1.2471, "step": 12158 }, { "epoch": 0.33, "learning_rate": 1.5584626561299008e-05, "loss": 1.2942, "step": 12159 }, { "epoch": 0.33, "learning_rate": 1.5583892814499252e-05, "loss": 1.6719, "step": 12160 }, { "epoch": 0.33, "learning_rate": 1.5583159024013748e-05, "loss": 1.3816, "step": 12161 }, { "epoch": 0.33, "learning_rate": 1.558242518984823e-05, "loss": 1.4697, "step": 12162 }, { "epoch": 0.33, "learning_rate": 1.558169131200844e-05, "loss": 1.3809, "step": 12163 }, { "epoch": 0.33, "learning_rate": 1.5580957390500127e-05, "loss": 1.3833, "step": 12164 }, { "epoch": 0.33, "learning_rate": 1.5580223425329022e-05, "loss": 1.325, "step": 12165 }, { "epoch": 0.33, "learning_rate": 1.5579489416500878e-05, "loss": 1.313, "step": 12166 }, { "epoch": 0.33, "learning_rate": 1.557875536402143e-05, "loss": 1.5273, "step": 12167 }, { "epoch": 0.33, "learning_rate": 1.5578021267896426e-05, "loss": 1.3528, "step": 12168 }, { "epoch": 0.33, "learning_rate": 1.55772871281316e-05, "loss": 1.7144, "step": 12169 }, { "epoch": 0.33, "learning_rate": 1.557655294473271e-05, "loss": 1.3799, "step": 12170 }, { "epoch": 0.33, "learning_rate": 1.5575818717705487e-05, "loss": 1.3071, "step": 12171 }, { "epoch": 0.33, "learning_rate": 1.5575084447055684e-05, "loss": 1.2739, "step": 12172 }, { "epoch": 0.33, "learning_rate": 1.557435013278904e-05, "loss": 1.3291, "step": 12173 }, { "epoch": 0.33, "learning_rate": 1.55736157749113e-05, "loss": 1.3528, "step": 12174 }, { "epoch": 0.33, "learning_rate": 1.5572881373428216e-05, "loss": 1.2793, "step": 12175 }, { "epoch": 0.33, "learning_rate": 1.5572146928345524e-05, "loss": 1.4236, "step": 12176 }, { "epoch": 0.33, "learning_rate": 1.5571412439668976e-05, "loss": 1.2312, "step": 12177 }, { "epoch": 0.33, "learning_rate": 1.5570677907404316e-05, "loss": 1.4338, "step": 12178 }, { "epoch": 0.33, "learning_rate": 1.5569943331557294e-05, "loss": 1.6885, "step": 12179 }, { "epoch": 0.33, "learning_rate": 1.5569208712133655e-05, "loss": 1.4167, "step": 12180 }, { "epoch": 0.33, "learning_rate": 1.5568474049139143e-05, "loss": 1.3459, "step": 12181 }, { "epoch": 0.33, "learning_rate": 1.5567739342579508e-05, "loss": 1.2256, "step": 12182 }, { "epoch": 0.33, "learning_rate": 1.55670045924605e-05, "loss": 1.3943, "step": 12183 }, { "epoch": 0.33, "learning_rate": 1.5566269798787864e-05, "loss": 1.438, "step": 12184 }, { "epoch": 0.33, "learning_rate": 1.5565534961567355e-05, "loss": 1.3147, "step": 12185 }, { "epoch": 0.33, "learning_rate": 1.5564800080804714e-05, "loss": 1.2681, "step": 12186 }, { "epoch": 0.33, "learning_rate": 1.5564065156505695e-05, "loss": 1.3157, "step": 12187 }, { "epoch": 0.33, "learning_rate": 1.5563330188676046e-05, "loss": 1.3909, "step": 12188 }, { "epoch": 0.33, "learning_rate": 1.5562595177321518e-05, "loss": 1.3071, "step": 12189 }, { "epoch": 0.33, "learning_rate": 1.556186012244786e-05, "loss": 1.2007, "step": 12190 }, { "epoch": 0.33, "learning_rate": 1.556112502406083e-05, "loss": 1.3613, "step": 12191 }, { "epoch": 0.33, "learning_rate": 1.5560389882166164e-05, "loss": 1.334, "step": 12192 }, { "epoch": 0.33, "learning_rate": 1.5559654696769628e-05, "loss": 1.6111, "step": 12193 }, { "epoch": 0.33, "learning_rate": 1.5558919467876964e-05, "loss": 1.1768, "step": 12194 }, { "epoch": 0.33, "learning_rate": 1.555818419549393e-05, "loss": 1.428, "step": 12195 }, { "epoch": 0.33, "learning_rate": 1.555744887962628e-05, "loss": 1.2686, "step": 12196 }, { "epoch": 0.33, "learning_rate": 1.5556713520279754e-05, "loss": 1.324, "step": 12197 }, { "epoch": 0.33, "learning_rate": 1.5555978117460123e-05, "loss": 1.2878, "step": 12198 }, { "epoch": 0.33, "learning_rate": 1.555524267117313e-05, "loss": 1.3916, "step": 12199 }, { "epoch": 0.33, "learning_rate": 1.555450718142453e-05, "loss": 1.397, "step": 12200 }, { "epoch": 0.33, "learning_rate": 1.555377164822008e-05, "loss": 1.2275, "step": 12201 }, { "epoch": 0.33, "learning_rate": 1.5553036071565526e-05, "loss": 1.2913, "step": 12202 }, { "epoch": 0.33, "learning_rate": 1.5552300451466633e-05, "loss": 1.3962, "step": 12203 }, { "epoch": 0.33, "learning_rate": 1.5551564787929153e-05, "loss": 1.1344, "step": 12204 }, { "epoch": 0.33, "learning_rate": 1.555082908095884e-05, "loss": 1.436, "step": 12205 }, { "epoch": 0.33, "learning_rate": 1.5550093330561448e-05, "loss": 1.238, "step": 12206 }, { "epoch": 0.33, "learning_rate": 1.554935753674274e-05, "loss": 1.2185, "step": 12207 }, { "epoch": 0.33, "learning_rate": 1.5548621699508464e-05, "loss": 1.3564, "step": 12208 }, { "epoch": 0.33, "learning_rate": 1.5547885818864382e-05, "loss": 1.4023, "step": 12209 }, { "epoch": 0.33, "learning_rate": 1.554714989481625e-05, "loss": 1.4502, "step": 12210 }, { "epoch": 0.33, "learning_rate": 1.5546413927369827e-05, "loss": 1.2268, "step": 12211 }, { "epoch": 0.33, "learning_rate": 1.554567791653087e-05, "loss": 1.7998, "step": 12212 }, { "epoch": 0.33, "learning_rate": 1.5544941862305134e-05, "loss": 1.3574, "step": 12213 }, { "epoch": 0.33, "learning_rate": 1.554420576469838e-05, "loss": 1.3423, "step": 12214 }, { "epoch": 0.33, "learning_rate": 1.5543469623716373e-05, "loss": 1.3921, "step": 12215 }, { "epoch": 0.33, "learning_rate": 1.554273343936486e-05, "loss": 1.3057, "step": 12216 }, { "epoch": 0.33, "learning_rate": 1.554199721164961e-05, "loss": 1.1819, "step": 12217 }, { "epoch": 0.33, "learning_rate": 1.554126094057638e-05, "loss": 1.3625, "step": 12218 }, { "epoch": 0.33, "learning_rate": 1.554052462615093e-05, "loss": 1.2637, "step": 12219 }, { "epoch": 0.33, "learning_rate": 1.553978826837902e-05, "loss": 1.3228, "step": 12220 }, { "epoch": 0.33, "learning_rate": 1.5539051867266414e-05, "loss": 1.2563, "step": 12221 }, { "epoch": 0.33, "learning_rate": 1.5538315422818865e-05, "loss": 1.3369, "step": 12222 }, { "epoch": 0.33, "learning_rate": 1.5537578935042142e-05, "loss": 1.4324, "step": 12223 }, { "epoch": 0.33, "learning_rate": 1.5536842403942008e-05, "loss": 1.3081, "step": 12224 }, { "epoch": 0.33, "learning_rate": 1.5536105829524223e-05, "loss": 1.364, "step": 12225 }, { "epoch": 0.33, "learning_rate": 1.553536921179455e-05, "loss": 1.3716, "step": 12226 }, { "epoch": 0.33, "learning_rate": 1.553463255075875e-05, "loss": 1.3625, "step": 12227 }, { "epoch": 0.33, "learning_rate": 1.5533895846422586e-05, "loss": 1.363, "step": 12228 }, { "epoch": 0.33, "learning_rate": 1.553315909879182e-05, "loss": 1.4229, "step": 12229 }, { "epoch": 0.33, "learning_rate": 1.5532422307872225e-05, "loss": 1.4336, "step": 12230 }, { "epoch": 0.33, "learning_rate": 1.5531685473669557e-05, "loss": 1.3093, "step": 12231 }, { "epoch": 0.33, "learning_rate": 1.5530948596189583e-05, "loss": 1.3882, "step": 12232 }, { "epoch": 0.33, "learning_rate": 1.5530211675438068e-05, "loss": 1.3589, "step": 12233 }, { "epoch": 0.33, "learning_rate": 1.552947471142078e-05, "loss": 1.199, "step": 12234 }, { "epoch": 0.33, "learning_rate": 1.552873770414348e-05, "loss": 1.3455, "step": 12235 }, { "epoch": 0.33, "learning_rate": 1.5528000653611935e-05, "loss": 1.2815, "step": 12236 }, { "epoch": 0.33, "learning_rate": 1.5527263559831913e-05, "loss": 1.2795, "step": 12237 }, { "epoch": 0.33, "learning_rate": 1.552652642280918e-05, "loss": 1.3892, "step": 12238 }, { "epoch": 0.33, "learning_rate": 1.5525789242549504e-05, "loss": 1.373, "step": 12239 }, { "epoch": 0.33, "learning_rate": 1.552505201905865e-05, "loss": 1.344, "step": 12240 }, { "epoch": 0.33, "learning_rate": 1.552431475234239e-05, "loss": 1.3, "step": 12241 }, { "epoch": 0.33, "learning_rate": 1.5523577442406486e-05, "loss": 1.2114, "step": 12242 }, { "epoch": 0.33, "learning_rate": 1.552284008925671e-05, "loss": 1.3398, "step": 12243 }, { "epoch": 0.33, "learning_rate": 1.552210269289883e-05, "loss": 1.2417, "step": 12244 }, { "epoch": 0.33, "learning_rate": 1.5521365253338614e-05, "loss": 1.2781, "step": 12245 }, { "epoch": 0.33, "learning_rate": 1.5520627770581836e-05, "loss": 1.3684, "step": 12246 }, { "epoch": 0.33, "learning_rate": 1.5519890244634258e-05, "loss": 1.1554, "step": 12247 }, { "epoch": 0.33, "learning_rate": 1.5519152675501658e-05, "loss": 1.2893, "step": 12248 }, { "epoch": 0.33, "learning_rate": 1.55184150631898e-05, "loss": 1.396, "step": 12249 }, { "epoch": 0.33, "learning_rate": 1.551767740770446e-05, "loss": 1.2075, "step": 12250 }, { "epoch": 0.33, "learning_rate": 1.5516939709051406e-05, "loss": 1.3137, "step": 12251 }, { "epoch": 0.33, "learning_rate": 1.551620196723641e-05, "loss": 1.7178, "step": 12252 }, { "epoch": 0.33, "learning_rate": 1.5515464182265243e-05, "loss": 1.4211, "step": 12253 }, { "epoch": 0.33, "learning_rate": 1.551472635414368e-05, "loss": 1.425, "step": 12254 }, { "epoch": 0.33, "learning_rate": 1.551398848287749e-05, "loss": 1.291, "step": 12255 }, { "epoch": 0.33, "learning_rate": 1.5513250568472443e-05, "loss": 1.3379, "step": 12256 }, { "epoch": 0.33, "learning_rate": 1.551251261093432e-05, "loss": 1.3914, "step": 12257 }, { "epoch": 0.33, "learning_rate": 1.551177461026889e-05, "loss": 1.3557, "step": 12258 }, { "epoch": 0.33, "learning_rate": 1.5511036566481926e-05, "loss": 1.2104, "step": 12259 }, { "epoch": 0.33, "learning_rate": 1.5510298479579203e-05, "loss": 1.3452, "step": 12260 }, { "epoch": 0.33, "learning_rate": 1.5509560349566498e-05, "loss": 1.1638, "step": 12261 }, { "epoch": 0.33, "learning_rate": 1.5508822176449584e-05, "loss": 1.2542, "step": 12262 }, { "epoch": 0.33, "learning_rate": 1.5508083960234233e-05, "loss": 1.3274, "step": 12263 }, { "epoch": 0.33, "learning_rate": 1.5507345700926228e-05, "loss": 1.2468, "step": 12264 }, { "epoch": 0.33, "learning_rate": 1.5506607398531333e-05, "loss": 1.3625, "step": 12265 }, { "epoch": 0.33, "learning_rate": 1.5505869053055337e-05, "loss": 1.3567, "step": 12266 }, { "epoch": 0.34, "learning_rate": 1.550513066450401e-05, "loss": 1.4307, "step": 12267 }, { "epoch": 0.34, "learning_rate": 1.550439223288313e-05, "loss": 1.3008, "step": 12268 }, { "epoch": 0.34, "learning_rate": 1.5503653758198466e-05, "loss": 1.2844, "step": 12269 }, { "epoch": 0.34, "learning_rate": 1.550291524045581e-05, "loss": 1.3528, "step": 12270 }, { "epoch": 0.34, "learning_rate": 1.550217667966093e-05, "loss": 1.4067, "step": 12271 }, { "epoch": 0.34, "learning_rate": 1.5501438075819607e-05, "loss": 1.3682, "step": 12272 }, { "epoch": 0.34, "learning_rate": 1.5500699428937623e-05, "loss": 1.2307, "step": 12273 }, { "epoch": 0.34, "learning_rate": 1.549996073902075e-05, "loss": 1.2712, "step": 12274 }, { "epoch": 0.34, "learning_rate": 1.549922200607477e-05, "loss": 1.447, "step": 12275 }, { "epoch": 0.34, "learning_rate": 1.5498483230105466e-05, "loss": 1.6899, "step": 12276 }, { "epoch": 0.34, "learning_rate": 1.549774441111861e-05, "loss": 1.2957, "step": 12277 }, { "epoch": 0.34, "learning_rate": 1.5497005549119992e-05, "loss": 1.2698, "step": 12278 }, { "epoch": 0.34, "learning_rate": 1.5496266644115386e-05, "loss": 1.405, "step": 12279 }, { "epoch": 0.34, "learning_rate": 1.5495527696110577e-05, "loss": 1.4189, "step": 12280 }, { "epoch": 0.34, "learning_rate": 1.5494788705111337e-05, "loss": 1.3872, "step": 12281 }, { "epoch": 0.34, "learning_rate": 1.5494049671123457e-05, "loss": 1.3447, "step": 12282 }, { "epoch": 0.34, "learning_rate": 1.5493310594152715e-05, "loss": 1.2505, "step": 12283 }, { "epoch": 0.34, "learning_rate": 1.5492571474204896e-05, "loss": 1.28, "step": 12284 }, { "epoch": 0.34, "learning_rate": 1.549183231128578e-05, "loss": 1.5288, "step": 12285 }, { "epoch": 0.34, "learning_rate": 1.549109310540115e-05, "loss": 1.2788, "step": 12286 }, { "epoch": 0.34, "learning_rate": 1.549035385655679e-05, "loss": 1.4941, "step": 12287 }, { "epoch": 0.34, "learning_rate": 1.5489614564758482e-05, "loss": 1.1406, "step": 12288 }, { "epoch": 0.34, "learning_rate": 1.5488875230012012e-05, "loss": 1.3256, "step": 12289 }, { "epoch": 0.34, "learning_rate": 1.5488135852323163e-05, "loss": 1.3032, "step": 12290 }, { "epoch": 0.34, "learning_rate": 1.548739643169772e-05, "loss": 1.407, "step": 12291 }, { "epoch": 0.34, "learning_rate": 1.5486656968141466e-05, "loss": 1.3091, "step": 12292 }, { "epoch": 0.34, "learning_rate": 1.548591746166019e-05, "loss": 1.2466, "step": 12293 }, { "epoch": 0.34, "learning_rate": 1.5485177912259677e-05, "loss": 1.377, "step": 12294 }, { "epoch": 0.34, "learning_rate": 1.548443831994571e-05, "loss": 1.3472, "step": 12295 }, { "epoch": 0.34, "learning_rate": 1.5483698684724077e-05, "loss": 1.4624, "step": 12296 }, { "epoch": 0.34, "learning_rate": 1.548295900660056e-05, "loss": 1.2791, "step": 12297 }, { "epoch": 0.34, "learning_rate": 1.5482219285580954e-05, "loss": 1.26, "step": 12298 }, { "epoch": 0.34, "learning_rate": 1.548147952167104e-05, "loss": 1.4204, "step": 12299 }, { "epoch": 0.34, "learning_rate": 1.548073971487661e-05, "loss": 1.3464, "step": 12300 }, { "epoch": 0.34, "learning_rate": 1.547999986520345e-05, "loss": 1.3938, "step": 12301 }, { "epoch": 0.34, "learning_rate": 1.5479259972657343e-05, "loss": 1.2239, "step": 12302 }, { "epoch": 0.34, "learning_rate": 1.547852003724409e-05, "loss": 1.2703, "step": 12303 }, { "epoch": 0.34, "learning_rate": 1.5477780058969466e-05, "loss": 1.4277, "step": 12304 }, { "epoch": 0.34, "learning_rate": 1.547704003783927e-05, "loss": 1.3813, "step": 12305 }, { "epoch": 0.34, "learning_rate": 1.547629997385929e-05, "loss": 1.5325, "step": 12306 }, { "epoch": 0.34, "learning_rate": 1.5475559867035308e-05, "loss": 1.1675, "step": 12307 }, { "epoch": 0.34, "learning_rate": 1.5474819717373123e-05, "loss": 1.4312, "step": 12308 }, { "epoch": 0.34, "learning_rate": 1.5474079524878525e-05, "loss": 1.2651, "step": 12309 }, { "epoch": 0.34, "learning_rate": 1.5473339289557305e-05, "loss": 1.4038, "step": 12310 }, { "epoch": 0.34, "learning_rate": 1.5472599011415245e-05, "loss": 1.3535, "step": 12311 }, { "epoch": 0.34, "learning_rate": 1.5471858690458146e-05, "loss": 1.3193, "step": 12312 }, { "epoch": 0.34, "learning_rate": 1.54711183266918e-05, "loss": 1.2631, "step": 12313 }, { "epoch": 0.34, "learning_rate": 1.5470377920121998e-05, "loss": 1.3599, "step": 12314 }, { "epoch": 0.34, "learning_rate": 1.5469637470754532e-05, "loss": 1.322, "step": 12315 }, { "epoch": 0.34, "learning_rate": 1.5468896978595188e-05, "loss": 1.4468, "step": 12316 }, { "epoch": 0.34, "learning_rate": 1.5468156443649774e-05, "loss": 1.4185, "step": 12317 }, { "epoch": 0.34, "learning_rate": 1.546741586592407e-05, "loss": 1.1614, "step": 12318 }, { "epoch": 0.34, "learning_rate": 1.5466675245423877e-05, "loss": 1.2495, "step": 12319 }, { "epoch": 0.34, "learning_rate": 1.5465934582154987e-05, "loss": 1.3455, "step": 12320 }, { "epoch": 0.34, "learning_rate": 1.5465193876123192e-05, "loss": 1.2634, "step": 12321 }, { "epoch": 0.34, "learning_rate": 1.5464453127334292e-05, "loss": 1.2925, "step": 12322 }, { "epoch": 0.34, "learning_rate": 1.5463712335794084e-05, "loss": 1.5103, "step": 12323 }, { "epoch": 0.34, "learning_rate": 1.546297150150836e-05, "loss": 1.2766, "step": 12324 }, { "epoch": 0.34, "learning_rate": 1.546223062448291e-05, "loss": 1.321, "step": 12325 }, { "epoch": 0.34, "learning_rate": 1.546148970472354e-05, "loss": 1.3911, "step": 12326 }, { "epoch": 0.34, "learning_rate": 1.5460748742236043e-05, "loss": 1.3086, "step": 12327 }, { "epoch": 0.34, "learning_rate": 1.5460007737026214e-05, "loss": 1.4431, "step": 12328 }, { "epoch": 0.34, "learning_rate": 1.545926668909985e-05, "loss": 1.2915, "step": 12329 }, { "epoch": 0.34, "learning_rate": 1.5458525598462756e-05, "loss": 1.1892, "step": 12330 }, { "epoch": 0.34, "learning_rate": 1.545778446512072e-05, "loss": 1.3218, "step": 12331 }, { "epoch": 0.34, "learning_rate": 1.5457043289079547e-05, "loss": 1.3528, "step": 12332 }, { "epoch": 0.34, "learning_rate": 1.545630207034503e-05, "loss": 1.366, "step": 12333 }, { "epoch": 0.34, "learning_rate": 1.5455560808922975e-05, "loss": 1.4067, "step": 12334 }, { "epoch": 0.34, "learning_rate": 1.5454819504819177e-05, "loss": 1.2974, "step": 12335 }, { "epoch": 0.34, "learning_rate": 1.5454078158039436e-05, "loss": 1.3936, "step": 12336 }, { "epoch": 0.34, "learning_rate": 1.545333676858955e-05, "loss": 1.3955, "step": 12337 }, { "epoch": 0.34, "learning_rate": 1.5452595336475325e-05, "loss": 1.3074, "step": 12338 }, { "epoch": 0.34, "learning_rate": 1.5451853861702557e-05, "loss": 1.4077, "step": 12339 }, { "epoch": 0.34, "learning_rate": 1.5451112344277048e-05, "loss": 1.2966, "step": 12340 }, { "epoch": 0.34, "learning_rate": 1.54503707842046e-05, "loss": 1.3928, "step": 12341 }, { "epoch": 0.34, "learning_rate": 1.5449629181491013e-05, "loss": 1.3899, "step": 12342 }, { "epoch": 0.34, "learning_rate": 1.544888753614209e-05, "loss": 1.3049, "step": 12343 }, { "epoch": 0.34, "learning_rate": 1.5448145848163633e-05, "loss": 1.2966, "step": 12344 }, { "epoch": 0.34, "learning_rate": 1.5447404117561446e-05, "loss": 1.5269, "step": 12345 }, { "epoch": 0.34, "learning_rate": 1.5446662344341324e-05, "loss": 1.415, "step": 12346 }, { "epoch": 0.34, "learning_rate": 1.5445920528509083e-05, "loss": 1.3794, "step": 12347 }, { "epoch": 0.34, "learning_rate": 1.544517867007052e-05, "loss": 1.2361, "step": 12348 }, { "epoch": 0.34, "learning_rate": 1.544443676903144e-05, "loss": 1.2539, "step": 12349 }, { "epoch": 0.34, "learning_rate": 1.544369482539765e-05, "loss": 1.4219, "step": 12350 }, { "epoch": 0.34, "learning_rate": 1.5442952839174948e-05, "loss": 1.2515, "step": 12351 }, { "epoch": 0.34, "learning_rate": 1.544221081036914e-05, "loss": 1.3716, "step": 12352 }, { "epoch": 0.34, "learning_rate": 1.5441468738986038e-05, "loss": 1.3472, "step": 12353 }, { "epoch": 0.34, "learning_rate": 1.544072662503144e-05, "loss": 1.4785, "step": 12354 }, { "epoch": 0.34, "learning_rate": 1.543998446851116e-05, "loss": 1.1162, "step": 12355 }, { "epoch": 0.34, "learning_rate": 1.5439242269430993e-05, "loss": 1.2173, "step": 12356 }, { "epoch": 0.34, "learning_rate": 1.5438500027796756e-05, "loss": 1.4053, "step": 12357 }, { "epoch": 0.34, "learning_rate": 1.5437757743614252e-05, "loss": 1.2346, "step": 12358 }, { "epoch": 0.34, "learning_rate": 1.543701541688929e-05, "loss": 1.4214, "step": 12359 }, { "epoch": 0.34, "learning_rate": 1.5436273047627676e-05, "loss": 1.2998, "step": 12360 }, { "epoch": 0.34, "learning_rate": 1.5435530635835213e-05, "loss": 1.3064, "step": 12361 }, { "epoch": 0.34, "learning_rate": 1.5434788181517718e-05, "loss": 1.4404, "step": 12362 }, { "epoch": 0.34, "learning_rate": 1.5434045684680995e-05, "loss": 1.4299, "step": 12363 }, { "epoch": 0.34, "learning_rate": 1.5433303145330855e-05, "loss": 1.2017, "step": 12364 }, { "epoch": 0.34, "learning_rate": 1.5432560563473106e-05, "loss": 1.4241, "step": 12365 }, { "epoch": 0.34, "learning_rate": 1.5431817939113557e-05, "loss": 1.2781, "step": 12366 }, { "epoch": 0.34, "learning_rate": 1.543107527225802e-05, "loss": 1.3513, "step": 12367 }, { "epoch": 0.34, "learning_rate": 1.54303325629123e-05, "loss": 1.3652, "step": 12368 }, { "epoch": 0.34, "learning_rate": 1.5429589811082215e-05, "loss": 1.4629, "step": 12369 }, { "epoch": 0.34, "learning_rate": 1.5428847016773572e-05, "loss": 1.3582, "step": 12370 }, { "epoch": 0.34, "learning_rate": 1.542810417999218e-05, "loss": 1.4531, "step": 12371 }, { "epoch": 0.34, "learning_rate": 1.5427361300743856e-05, "loss": 1.2656, "step": 12372 }, { "epoch": 0.34, "learning_rate": 1.542661837903441e-05, "loss": 1.4785, "step": 12373 }, { "epoch": 0.34, "learning_rate": 1.5425875414869652e-05, "loss": 1.2869, "step": 12374 }, { "epoch": 0.34, "learning_rate": 1.5425132408255396e-05, "loss": 1.259, "step": 12375 }, { "epoch": 0.34, "learning_rate": 1.5424389359197458e-05, "loss": 1.1826, "step": 12376 }, { "epoch": 0.34, "learning_rate": 1.5423646267701648e-05, "loss": 1.3945, "step": 12377 }, { "epoch": 0.34, "learning_rate": 1.5422903133773776e-05, "loss": 1.354, "step": 12378 }, { "epoch": 0.34, "learning_rate": 1.5422159957419664e-05, "loss": 1.0308, "step": 12379 }, { "epoch": 0.34, "learning_rate": 1.542141673864512e-05, "loss": 1.3042, "step": 12380 }, { "epoch": 0.34, "learning_rate": 1.542067347745596e-05, "loss": 1.2812, "step": 12381 }, { "epoch": 0.34, "learning_rate": 1.5419930173858e-05, "loss": 1.5703, "step": 12382 }, { "epoch": 0.34, "learning_rate": 1.5419186827857058e-05, "loss": 1.3113, "step": 12383 }, { "epoch": 0.34, "learning_rate": 1.5418443439458944e-05, "loss": 1.397, "step": 12384 }, { "epoch": 0.34, "learning_rate": 1.5417700008669477e-05, "loss": 1.3276, "step": 12385 }, { "epoch": 0.34, "learning_rate": 1.541695653549447e-05, "loss": 1.335, "step": 12386 }, { "epoch": 0.34, "learning_rate": 1.5416213019939744e-05, "loss": 1.2812, "step": 12387 }, { "epoch": 0.34, "learning_rate": 1.5415469462011116e-05, "loss": 1.3557, "step": 12388 }, { "epoch": 0.34, "learning_rate": 1.54147258617144e-05, "loss": 1.3413, "step": 12389 }, { "epoch": 0.34, "learning_rate": 1.5413982219055418e-05, "loss": 1.3223, "step": 12390 }, { "epoch": 0.34, "learning_rate": 1.5413238534039983e-05, "loss": 1.7637, "step": 12391 }, { "epoch": 0.34, "learning_rate": 1.5412494806673913e-05, "loss": 1.25, "step": 12392 }, { "epoch": 0.34, "learning_rate": 1.5411751036963034e-05, "loss": 1.3357, "step": 12393 }, { "epoch": 0.34, "learning_rate": 1.5411007224913154e-05, "loss": 1.2202, "step": 12394 }, { "epoch": 0.34, "learning_rate": 1.54102633705301e-05, "loss": 1.3088, "step": 12395 }, { "epoch": 0.34, "learning_rate": 1.540951947381969e-05, "loss": 1.3567, "step": 12396 }, { "epoch": 0.34, "learning_rate": 1.540877553478774e-05, "loss": 1.3232, "step": 12397 }, { "epoch": 0.34, "learning_rate": 1.540803155344008e-05, "loss": 1.394, "step": 12398 }, { "epoch": 0.34, "learning_rate": 1.540728752978252e-05, "loss": 1.2793, "step": 12399 }, { "epoch": 0.34, "learning_rate": 1.5406543463820883e-05, "loss": 1.1782, "step": 12400 }, { "epoch": 0.34, "learning_rate": 1.5405799355560997e-05, "loss": 1.3118, "step": 12401 }, { "epoch": 0.34, "learning_rate": 1.5405055205008678e-05, "loss": 1.3474, "step": 12402 }, { "epoch": 0.34, "learning_rate": 1.5404311012169747e-05, "loss": 1.2446, "step": 12403 }, { "epoch": 0.34, "learning_rate": 1.540356677705003e-05, "loss": 1.2114, "step": 12404 }, { "epoch": 0.34, "learning_rate": 1.5402822499655345e-05, "loss": 1.3811, "step": 12405 }, { "epoch": 0.34, "learning_rate": 1.540207817999152e-05, "loss": 1.1721, "step": 12406 }, { "epoch": 0.34, "learning_rate": 1.540133381806437e-05, "loss": 1.353, "step": 12407 }, { "epoch": 0.34, "learning_rate": 1.540058941387973e-05, "loss": 1.3445, "step": 12408 }, { "epoch": 0.34, "learning_rate": 1.5399844967443412e-05, "loss": 1.4829, "step": 12409 }, { "epoch": 0.34, "learning_rate": 1.5399100478761253e-05, "loss": 1.3938, "step": 12410 }, { "epoch": 0.34, "learning_rate": 1.539835594783907e-05, "loss": 1.4204, "step": 12411 }, { "epoch": 0.34, "learning_rate": 1.5397611374682686e-05, "loss": 1.7485, "step": 12412 }, { "epoch": 0.34, "learning_rate": 1.5396866759297927e-05, "loss": 1.23, "step": 12413 }, { "epoch": 0.34, "learning_rate": 1.5396122101690622e-05, "loss": 1.3196, "step": 12414 }, { "epoch": 0.34, "learning_rate": 1.5395377401866595e-05, "loss": 1.3174, "step": 12415 }, { "epoch": 0.34, "learning_rate": 1.5394632659831674e-05, "loss": 1.2617, "step": 12416 }, { "epoch": 0.34, "learning_rate": 1.539388787559168e-05, "loss": 1.1506, "step": 12417 }, { "epoch": 0.34, "learning_rate": 1.539314304915245e-05, "loss": 1.2864, "step": 12418 }, { "epoch": 0.34, "learning_rate": 1.5392398180519797e-05, "loss": 1.354, "step": 12419 }, { "epoch": 0.34, "learning_rate": 1.539165326969956e-05, "loss": 1.2744, "step": 12420 }, { "epoch": 0.34, "learning_rate": 1.5390908316697566e-05, "loss": 1.5415, "step": 12421 }, { "epoch": 0.34, "learning_rate": 1.539016332151964e-05, "loss": 1.2607, "step": 12422 }, { "epoch": 0.34, "learning_rate": 1.5389418284171607e-05, "loss": 1.2449, "step": 12423 }, { "epoch": 0.34, "learning_rate": 1.53886732046593e-05, "loss": 1.3911, "step": 12424 }, { "epoch": 0.34, "learning_rate": 1.538792808298855e-05, "loss": 1.2917, "step": 12425 }, { "epoch": 0.34, "learning_rate": 1.5387182919165184e-05, "loss": 1.3381, "step": 12426 }, { "epoch": 0.34, "learning_rate": 1.538643771319503e-05, "loss": 1.1897, "step": 12427 }, { "epoch": 0.34, "learning_rate": 1.5385692465083923e-05, "loss": 1.3623, "step": 12428 }, { "epoch": 0.34, "learning_rate": 1.5384947174837688e-05, "loss": 1.3882, "step": 12429 }, { "epoch": 0.34, "learning_rate": 1.5384201842462158e-05, "loss": 1.3545, "step": 12430 }, { "epoch": 0.34, "learning_rate": 1.5383456467963168e-05, "loss": 1.4197, "step": 12431 }, { "epoch": 0.34, "learning_rate": 1.5382711051346545e-05, "loss": 1.1946, "step": 12432 }, { "epoch": 0.34, "learning_rate": 1.538196559261812e-05, "loss": 1.3521, "step": 12433 }, { "epoch": 0.34, "learning_rate": 1.5381220091783727e-05, "loss": 1.217, "step": 12434 }, { "epoch": 0.34, "learning_rate": 1.5380474548849203e-05, "loss": 1.2266, "step": 12435 }, { "epoch": 0.34, "learning_rate": 1.537972896382037e-05, "loss": 1.2117, "step": 12436 }, { "epoch": 0.34, "learning_rate": 1.5378983336703074e-05, "loss": 1.4722, "step": 12437 }, { "epoch": 0.34, "learning_rate": 1.5378237667503134e-05, "loss": 1.2666, "step": 12438 }, { "epoch": 0.34, "learning_rate": 1.53774919562264e-05, "loss": 1.293, "step": 12439 }, { "epoch": 0.34, "learning_rate": 1.5376746202878693e-05, "loss": 1.3477, "step": 12440 }, { "epoch": 0.34, "learning_rate": 1.5376000407465853e-05, "loss": 1.4109, "step": 12441 }, { "epoch": 0.34, "learning_rate": 1.537525456999371e-05, "loss": 1.2625, "step": 12442 }, { "epoch": 0.34, "learning_rate": 1.5374508690468108e-05, "loss": 1.0898, "step": 12443 }, { "epoch": 0.34, "learning_rate": 1.537376276889487e-05, "loss": 1.3743, "step": 12444 }, { "epoch": 0.34, "learning_rate": 1.5373016805279844e-05, "loss": 1.3962, "step": 12445 }, { "epoch": 0.34, "learning_rate": 1.5372270799628863e-05, "loss": 1.2454, "step": 12446 }, { "epoch": 0.34, "learning_rate": 1.537152475194776e-05, "loss": 1.4092, "step": 12447 }, { "epoch": 0.34, "learning_rate": 1.537077866224237e-05, "loss": 1.4111, "step": 12448 }, { "epoch": 0.34, "learning_rate": 1.537003253051854e-05, "loss": 1.3447, "step": 12449 }, { "epoch": 0.34, "learning_rate": 1.5369286356782092e-05, "loss": 1.3853, "step": 12450 }, { "epoch": 0.34, "learning_rate": 1.536854014103888e-05, "loss": 1.2798, "step": 12451 }, { "epoch": 0.34, "learning_rate": 1.5367793883294732e-05, "loss": 1.375, "step": 12452 }, { "epoch": 0.34, "learning_rate": 1.536704758355549e-05, "loss": 1.3992, "step": 12453 }, { "epoch": 0.34, "learning_rate": 1.5366301241826987e-05, "loss": 1.2275, "step": 12454 }, { "epoch": 0.34, "learning_rate": 1.536555485811507e-05, "loss": 1.4536, "step": 12455 }, { "epoch": 0.34, "learning_rate": 1.5364808432425574e-05, "loss": 1.1121, "step": 12456 }, { "epoch": 0.34, "learning_rate": 1.536406196476434e-05, "loss": 1.3552, "step": 12457 }, { "epoch": 0.34, "learning_rate": 1.5363315455137206e-05, "loss": 1.3809, "step": 12458 }, { "epoch": 0.34, "learning_rate": 1.5362568903550018e-05, "loss": 1.3362, "step": 12459 }, { "epoch": 0.34, "learning_rate": 1.5361822310008607e-05, "loss": 1.3049, "step": 12460 }, { "epoch": 0.34, "learning_rate": 1.536107567451882e-05, "loss": 1.2002, "step": 12461 }, { "epoch": 0.34, "learning_rate": 1.53603289970865e-05, "loss": 1.312, "step": 12462 }, { "epoch": 0.34, "learning_rate": 1.5359582277717487e-05, "loss": 1.3792, "step": 12463 }, { "epoch": 0.34, "learning_rate": 1.5358835516417623e-05, "loss": 1.6353, "step": 12464 }, { "epoch": 0.34, "learning_rate": 1.5358088713192748e-05, "loss": 1.3982, "step": 12465 }, { "epoch": 0.34, "learning_rate": 1.535734186804871e-05, "loss": 1.2012, "step": 12466 }, { "epoch": 0.34, "learning_rate": 1.5356594980991345e-05, "loss": 1.3135, "step": 12467 }, { "epoch": 0.34, "learning_rate": 1.53558480520265e-05, "loss": 1.2878, "step": 12468 }, { "epoch": 0.34, "learning_rate": 1.535510108116002e-05, "loss": 1.3584, "step": 12469 }, { "epoch": 0.34, "learning_rate": 1.5354354068397745e-05, "loss": 1.3213, "step": 12470 }, { "epoch": 0.34, "learning_rate": 1.5353607013745523e-05, "loss": 1.7627, "step": 12471 }, { "epoch": 0.34, "learning_rate": 1.5352859917209198e-05, "loss": 1.2925, "step": 12472 }, { "epoch": 0.34, "learning_rate": 1.5352112778794612e-05, "loss": 1.3752, "step": 12473 }, { "epoch": 0.34, "learning_rate": 1.5351365598507613e-05, "loss": 1.3296, "step": 12474 }, { "epoch": 0.34, "learning_rate": 1.5350618376354046e-05, "loss": 1.2693, "step": 12475 }, { "epoch": 0.34, "learning_rate": 1.5349871112339755e-05, "loss": 1.2095, "step": 12476 }, { "epoch": 0.34, "learning_rate": 1.534912380647059e-05, "loss": 1.3481, "step": 12477 }, { "epoch": 0.34, "learning_rate": 1.53483764587524e-05, "loss": 1.3179, "step": 12478 }, { "epoch": 0.34, "learning_rate": 1.5347629069191023e-05, "loss": 1.2905, "step": 12479 }, { "epoch": 0.34, "learning_rate": 1.534688163779231e-05, "loss": 1.3049, "step": 12480 }, { "epoch": 0.34, "learning_rate": 1.534613416456211e-05, "loss": 1.2671, "step": 12481 }, { "epoch": 0.34, "learning_rate": 1.5345386649506272e-05, "loss": 1.2957, "step": 12482 }, { "epoch": 0.34, "learning_rate": 1.534463909263064e-05, "loss": 1.2229, "step": 12483 }, { "epoch": 0.34, "learning_rate": 1.534389149394107e-05, "loss": 1.2759, "step": 12484 }, { "epoch": 0.34, "learning_rate": 1.5343143853443397e-05, "loss": 1.4404, "step": 12485 }, { "epoch": 0.34, "learning_rate": 1.5342396171143488e-05, "loss": 1.2327, "step": 12486 }, { "epoch": 0.34, "learning_rate": 1.5341648447047178e-05, "loss": 1.3245, "step": 12487 }, { "epoch": 0.34, "learning_rate": 1.5340900681160326e-05, "loss": 1.4207, "step": 12488 }, { "epoch": 0.34, "learning_rate": 1.5340152873488772e-05, "loss": 1.2151, "step": 12489 }, { "epoch": 0.34, "learning_rate": 1.533940502403838e-05, "loss": 1.3552, "step": 12490 }, { "epoch": 0.34, "learning_rate": 1.533865713281499e-05, "loss": 1.2239, "step": 12491 }, { "epoch": 0.34, "learning_rate": 1.533790919982446e-05, "loss": 1.4043, "step": 12492 }, { "epoch": 0.34, "learning_rate": 1.5337161225072635e-05, "loss": 1.2861, "step": 12493 }, { "epoch": 0.34, "learning_rate": 1.5336413208565373e-05, "loss": 1.3655, "step": 12494 }, { "epoch": 0.34, "learning_rate": 1.5335665150308525e-05, "loss": 1.3232, "step": 12495 }, { "epoch": 0.34, "learning_rate": 1.5334917050307937e-05, "loss": 1.3743, "step": 12496 }, { "epoch": 0.34, "learning_rate": 1.533416890856947e-05, "loss": 1.4824, "step": 12497 }, { "epoch": 0.34, "learning_rate": 1.5333420725098973e-05, "loss": 1.4238, "step": 12498 }, { "epoch": 0.34, "learning_rate": 1.5332672499902298e-05, "loss": 1.3716, "step": 12499 }, { "epoch": 0.34, "learning_rate": 1.5331924232985303e-05, "loss": 1.2959, "step": 12500 }, { "epoch": 0.34, "learning_rate": 1.5331175924353843e-05, "loss": 1.3469, "step": 12501 }, { "epoch": 0.34, "learning_rate": 1.5330427574013763e-05, "loss": 1.2598, "step": 12502 }, { "epoch": 0.34, "learning_rate": 1.532967918197093e-05, "loss": 1.3088, "step": 12503 }, { "epoch": 0.34, "learning_rate": 1.5328930748231193e-05, "loss": 1.2378, "step": 12504 }, { "epoch": 0.34, "learning_rate": 1.5328182272800406e-05, "loss": 1.4067, "step": 12505 }, { "epoch": 0.34, "learning_rate": 1.5327433755684424e-05, "loss": 1.376, "step": 12506 }, { "epoch": 0.34, "learning_rate": 1.5326685196889104e-05, "loss": 1.2957, "step": 12507 }, { "epoch": 0.34, "learning_rate": 1.532593659642031e-05, "loss": 1.1689, "step": 12508 }, { "epoch": 0.34, "learning_rate": 1.5325187954283888e-05, "loss": 1.2744, "step": 12509 }, { "epoch": 0.34, "learning_rate": 1.5324439270485703e-05, "loss": 1.2292, "step": 12510 }, { "epoch": 0.34, "learning_rate": 1.5323690545031606e-05, "loss": 1.3833, "step": 12511 }, { "epoch": 0.34, "learning_rate": 1.532294177792746e-05, "loss": 1.4624, "step": 12512 }, { "epoch": 0.34, "learning_rate": 1.532219296917912e-05, "loss": 1.262, "step": 12513 }, { "epoch": 0.34, "learning_rate": 1.5321444118792443e-05, "loss": 1.3833, "step": 12514 }, { "epoch": 0.34, "learning_rate": 1.532069522677329e-05, "loss": 1.4111, "step": 12515 }, { "epoch": 0.34, "learning_rate": 1.5319946293127523e-05, "loss": 1.3879, "step": 12516 }, { "epoch": 0.34, "learning_rate": 1.531919731786099e-05, "loss": 1.208, "step": 12517 }, { "epoch": 0.34, "learning_rate": 1.5318448300979568e-05, "loss": 1.376, "step": 12518 }, { "epoch": 0.34, "learning_rate": 1.5317699242489102e-05, "loss": 1.2566, "step": 12519 }, { "epoch": 0.34, "learning_rate": 1.531695014239546e-05, "loss": 1.2007, "step": 12520 }, { "epoch": 0.34, "learning_rate": 1.5316201000704494e-05, "loss": 1.3516, "step": 12521 }, { "epoch": 0.34, "learning_rate": 1.531545181742208e-05, "loss": 1.3782, "step": 12522 }, { "epoch": 0.34, "learning_rate": 1.531470259255406e-05, "loss": 1.3833, "step": 12523 }, { "epoch": 0.34, "learning_rate": 1.531395332610632e-05, "loss": 1.1726, "step": 12524 }, { "epoch": 0.34, "learning_rate": 1.5313204018084698e-05, "loss": 1.2976, "step": 12525 }, { "epoch": 0.34, "learning_rate": 1.531245466849507e-05, "loss": 1.3079, "step": 12526 }, { "epoch": 0.34, "learning_rate": 1.531170527734329e-05, "loss": 1.2986, "step": 12527 }, { "epoch": 0.34, "learning_rate": 1.531095584463523e-05, "loss": 1.3423, "step": 12528 }, { "epoch": 0.34, "learning_rate": 1.531020637037675e-05, "loss": 1.2222, "step": 12529 }, { "epoch": 0.34, "learning_rate": 1.5309456854573708e-05, "loss": 1.3606, "step": 12530 }, { "epoch": 0.34, "learning_rate": 1.5308707297231976e-05, "loss": 1.3801, "step": 12531 }, { "epoch": 0.34, "learning_rate": 1.5307957698357413e-05, "loss": 1.3459, "step": 12532 }, { "epoch": 0.34, "learning_rate": 1.5307208057955888e-05, "loss": 1.282, "step": 12533 }, { "epoch": 0.34, "learning_rate": 1.530645837603326e-05, "loss": 1.2607, "step": 12534 }, { "epoch": 0.34, "learning_rate": 1.5305708652595396e-05, "loss": 1.175, "step": 12535 }, { "epoch": 0.34, "learning_rate": 1.5304958887648162e-05, "loss": 1.4707, "step": 12536 }, { "epoch": 0.34, "learning_rate": 1.5304209081197425e-05, "loss": 1.3462, "step": 12537 }, { "epoch": 0.34, "learning_rate": 1.5303459233249053e-05, "loss": 1.4827, "step": 12538 }, { "epoch": 0.34, "learning_rate": 1.5302709343808908e-05, "loss": 1.1768, "step": 12539 }, { "epoch": 0.34, "learning_rate": 1.5301959412882857e-05, "loss": 1.4028, "step": 12540 }, { "epoch": 0.34, "learning_rate": 1.5301209440476773e-05, "loss": 1.4746, "step": 12541 }, { "epoch": 0.34, "learning_rate": 1.5300459426596514e-05, "loss": 1.2109, "step": 12542 }, { "epoch": 0.34, "learning_rate": 1.5299709371247954e-05, "loss": 1.3523, "step": 12543 }, { "epoch": 0.34, "learning_rate": 1.529895927443696e-05, "loss": 1.1865, "step": 12544 }, { "epoch": 0.34, "learning_rate": 1.5298209136169403e-05, "loss": 1.3237, "step": 12545 }, { "epoch": 0.34, "learning_rate": 1.5297458956451148e-05, "loss": 1.1946, "step": 12546 }, { "epoch": 0.34, "learning_rate": 1.5296708735288065e-05, "loss": 1.2032, "step": 12547 }, { "epoch": 0.34, "learning_rate": 1.529595847268602e-05, "loss": 1.4326, "step": 12548 }, { "epoch": 0.34, "learning_rate": 1.529520816865089e-05, "loss": 1.4631, "step": 12549 }, { "epoch": 0.34, "learning_rate": 1.5294457823188543e-05, "loss": 1.4333, "step": 12550 }, { "epoch": 0.34, "learning_rate": 1.5293707436304846e-05, "loss": 1.2852, "step": 12551 }, { "epoch": 0.34, "learning_rate": 1.5292957008005667e-05, "loss": 1.3999, "step": 12552 }, { "epoch": 0.34, "learning_rate": 1.5292206538296887e-05, "loss": 1.3135, "step": 12553 }, { "epoch": 0.34, "learning_rate": 1.5291456027184368e-05, "loss": 1.3899, "step": 12554 }, { "epoch": 0.34, "learning_rate": 1.5290705474673987e-05, "loss": 1.2886, "step": 12555 }, { "epoch": 0.34, "learning_rate": 1.5289954880771616e-05, "loss": 1.3308, "step": 12556 }, { "epoch": 0.34, "learning_rate": 1.528920424548312e-05, "loss": 1.4517, "step": 12557 }, { "epoch": 0.34, "learning_rate": 1.5288453568814384e-05, "loss": 1.4048, "step": 12558 }, { "epoch": 0.34, "learning_rate": 1.528770285077127e-05, "loss": 1.2761, "step": 12559 }, { "epoch": 0.34, "learning_rate": 1.5286952091359656e-05, "loss": 1.4177, "step": 12560 }, { "epoch": 0.34, "learning_rate": 1.5286201290585415e-05, "loss": 1.5112, "step": 12561 }, { "epoch": 0.34, "learning_rate": 1.528545044845442e-05, "loss": 1.3186, "step": 12562 }, { "epoch": 0.34, "learning_rate": 1.5284699564972548e-05, "loss": 1.2993, "step": 12563 }, { "epoch": 0.34, "learning_rate": 1.528394864014567e-05, "loss": 1.272, "step": 12564 }, { "epoch": 0.34, "learning_rate": 1.5283197673979666e-05, "loss": 1.4202, "step": 12565 }, { "epoch": 0.34, "learning_rate": 1.5282446666480404e-05, "loss": 1.0925, "step": 12566 }, { "epoch": 0.34, "learning_rate": 1.5281695617653765e-05, "loss": 1.3669, "step": 12567 }, { "epoch": 0.34, "learning_rate": 1.5280944527505623e-05, "loss": 1.2175, "step": 12568 }, { "epoch": 0.34, "learning_rate": 1.528019339604185e-05, "loss": 1.1938, "step": 12569 }, { "epoch": 0.34, "learning_rate": 1.527944222326833e-05, "loss": 1.3896, "step": 12570 }, { "epoch": 0.34, "learning_rate": 1.5278691009190936e-05, "loss": 1.2434, "step": 12571 }, { "epoch": 0.34, "learning_rate": 1.5277939753815547e-05, "loss": 1.2864, "step": 12572 }, { "epoch": 0.34, "learning_rate": 1.5277188457148043e-05, "loss": 1.3433, "step": 12573 }, { "epoch": 0.34, "learning_rate": 1.5276437119194293e-05, "loss": 1.2278, "step": 12574 }, { "epoch": 0.34, "learning_rate": 1.527568573996018e-05, "loss": 1.1956, "step": 12575 }, { "epoch": 0.34, "learning_rate": 1.5274934319451583e-05, "loss": 1.4067, "step": 12576 }, { "epoch": 0.34, "learning_rate": 1.5274182857674382e-05, "loss": 1.3015, "step": 12577 }, { "epoch": 0.34, "learning_rate": 1.527343135463445e-05, "loss": 1.2666, "step": 12578 }, { "epoch": 0.34, "learning_rate": 1.5272679810337677e-05, "loss": 1.2087, "step": 12579 }, { "epoch": 0.34, "learning_rate": 1.5271928224789932e-05, "loss": 1.415, "step": 12580 }, { "epoch": 0.34, "learning_rate": 1.5271176597997104e-05, "loss": 1.3538, "step": 12581 }, { "epoch": 0.34, "learning_rate": 1.5270424929965067e-05, "loss": 1.4414, "step": 12582 }, { "epoch": 0.34, "learning_rate": 1.5269673220699703e-05, "loss": 1.4121, "step": 12583 }, { "epoch": 0.34, "learning_rate": 1.526892147020689e-05, "loss": 1.5215, "step": 12584 }, { "epoch": 0.34, "learning_rate": 1.526816967849252e-05, "loss": 1.1348, "step": 12585 }, { "epoch": 0.34, "learning_rate": 1.5267417845562463e-05, "loss": 1.261, "step": 12586 }, { "epoch": 0.34, "learning_rate": 1.5266665971422607e-05, "loss": 1.1384, "step": 12587 }, { "epoch": 0.34, "learning_rate": 1.5265914056078833e-05, "loss": 1.3887, "step": 12588 }, { "epoch": 0.34, "learning_rate": 1.5265162099537024e-05, "loss": 1.4028, "step": 12589 }, { "epoch": 0.34, "learning_rate": 1.5264410101803063e-05, "loss": 1.248, "step": 12590 }, { "epoch": 0.34, "learning_rate": 1.526365806288283e-05, "loss": 1.1533, "step": 12591 }, { "epoch": 0.34, "learning_rate": 1.5262905982782218e-05, "loss": 1.3049, "step": 12592 }, { "epoch": 0.34, "learning_rate": 1.52621538615071e-05, "loss": 1.3772, "step": 12593 }, { "epoch": 0.34, "learning_rate": 1.5261401699063364e-05, "loss": 1.3359, "step": 12594 }, { "epoch": 0.34, "learning_rate": 1.5260649495456898e-05, "loss": 1.387, "step": 12595 }, { "epoch": 0.34, "learning_rate": 1.525989725069358e-05, "loss": 1.3516, "step": 12596 }, { "epoch": 0.34, "learning_rate": 1.5259144964779304e-05, "loss": 1.4331, "step": 12597 }, { "epoch": 0.34, "learning_rate": 1.5258392637719945e-05, "loss": 1.4065, "step": 12598 }, { "epoch": 0.34, "learning_rate": 1.5257640269521398e-05, "loss": 1.4514, "step": 12599 }, { "epoch": 0.34, "learning_rate": 1.5256887860189546e-05, "loss": 1.2656, "step": 12600 }, { "epoch": 0.34, "learning_rate": 1.5256135409730272e-05, "loss": 1.4646, "step": 12601 }, { "epoch": 0.34, "learning_rate": 1.5255382918149471e-05, "loss": 1.3799, "step": 12602 }, { "epoch": 0.34, "learning_rate": 1.5254630385453024e-05, "loss": 1.4382, "step": 12603 }, { "epoch": 0.34, "learning_rate": 1.5253877811646818e-05, "loss": 1.4385, "step": 12604 }, { "epoch": 0.34, "learning_rate": 1.5253125196736744e-05, "loss": 1.2683, "step": 12605 }, { "epoch": 0.34, "learning_rate": 1.5252372540728688e-05, "loss": 1.3989, "step": 12606 }, { "epoch": 0.34, "learning_rate": 1.525161984362854e-05, "loss": 1.3765, "step": 12607 }, { "epoch": 0.34, "learning_rate": 1.5250867105442188e-05, "loss": 1.3813, "step": 12608 }, { "epoch": 0.34, "learning_rate": 1.525011432617552e-05, "loss": 1.3594, "step": 12609 }, { "epoch": 0.34, "learning_rate": 1.5249361505834429e-05, "loss": 1.3809, "step": 12610 }, { "epoch": 0.34, "learning_rate": 1.5248608644424798e-05, "loss": 1.429, "step": 12611 }, { "epoch": 0.34, "learning_rate": 1.5247855741952524e-05, "loss": 1.4126, "step": 12612 }, { "epoch": 0.34, "learning_rate": 1.5247102798423492e-05, "loss": 1.293, "step": 12613 }, { "epoch": 0.34, "learning_rate": 1.5246349813843595e-05, "loss": 1.3672, "step": 12614 }, { "epoch": 0.34, "learning_rate": 1.5245596788218726e-05, "loss": 1.4133, "step": 12615 }, { "epoch": 0.34, "learning_rate": 1.5244843721554772e-05, "loss": 1.269, "step": 12616 }, { "epoch": 0.34, "learning_rate": 1.5244090613857628e-05, "loss": 1.4565, "step": 12617 }, { "epoch": 0.34, "learning_rate": 1.5243337465133186e-05, "loss": 1.2451, "step": 12618 }, { "epoch": 0.34, "learning_rate": 1.5242584275387335e-05, "loss": 1.4148, "step": 12619 }, { "epoch": 0.34, "learning_rate": 1.5241831044625972e-05, "loss": 1.2837, "step": 12620 }, { "epoch": 0.34, "learning_rate": 1.5241077772854988e-05, "loss": 1.2817, "step": 12621 }, { "epoch": 0.34, "learning_rate": 1.5240324460080277e-05, "loss": 1.3765, "step": 12622 }, { "epoch": 0.34, "learning_rate": 1.5239571106307729e-05, "loss": 1.4646, "step": 12623 }, { "epoch": 0.34, "learning_rate": 1.5238817711543243e-05, "loss": 1.3347, "step": 12624 }, { "epoch": 0.34, "learning_rate": 1.5238064275792708e-05, "loss": 1.3276, "step": 12625 }, { "epoch": 0.34, "learning_rate": 1.5237310799062024e-05, "loss": 1.4136, "step": 12626 }, { "epoch": 0.34, "learning_rate": 1.523655728135708e-05, "loss": 1.438, "step": 12627 }, { "epoch": 0.34, "learning_rate": 1.5235803722683775e-05, "loss": 1.3721, "step": 12628 }, { "epoch": 0.34, "learning_rate": 1.5235050123048006e-05, "loss": 1.2716, "step": 12629 }, { "epoch": 0.34, "learning_rate": 1.5234296482455664e-05, "loss": 1.2207, "step": 12630 }, { "epoch": 0.34, "learning_rate": 1.5233542800912648e-05, "loss": 1.7651, "step": 12631 }, { "epoch": 0.34, "learning_rate": 1.5232789078424855e-05, "loss": 1.1659, "step": 12632 }, { "epoch": 0.34, "learning_rate": 1.5232035314998182e-05, "loss": 1.3677, "step": 12633 }, { "epoch": 0.35, "learning_rate": 1.5231281510638522e-05, "loss": 1.2898, "step": 12634 }, { "epoch": 0.35, "learning_rate": 1.5230527665351778e-05, "loss": 1.375, "step": 12635 }, { "epoch": 0.35, "learning_rate": 1.5229773779143843e-05, "loss": 1.3774, "step": 12636 }, { "epoch": 0.35, "learning_rate": 1.5229019852020619e-05, "loss": 1.3218, "step": 12637 }, { "epoch": 0.35, "learning_rate": 1.5228265883988002e-05, "loss": 1.2966, "step": 12638 }, { "epoch": 0.35, "learning_rate": 1.5227511875051889e-05, "loss": 1.3667, "step": 12639 }, { "epoch": 0.35, "learning_rate": 1.5226757825218187e-05, "loss": 1.0862, "step": 12640 }, { "epoch": 0.35, "learning_rate": 1.5226003734492783e-05, "loss": 1.2339, "step": 12641 }, { "epoch": 0.35, "learning_rate": 1.5225249602881587e-05, "loss": 1.304, "step": 12642 }, { "epoch": 0.35, "learning_rate": 1.5224495430390494e-05, "loss": 1.3167, "step": 12643 }, { "epoch": 0.35, "learning_rate": 1.5223741217025408e-05, "loss": 1.3716, "step": 12644 }, { "epoch": 0.35, "learning_rate": 1.522298696279222e-05, "loss": 1.4878, "step": 12645 }, { "epoch": 0.35, "learning_rate": 1.5222232667696845e-05, "loss": 1.3416, "step": 12646 }, { "epoch": 0.35, "learning_rate": 1.5221478331745175e-05, "loss": 1.4077, "step": 12647 }, { "epoch": 0.35, "learning_rate": 1.5220723954943113e-05, "loss": 1.2559, "step": 12648 }, { "epoch": 0.35, "learning_rate": 1.5219969537296563e-05, "loss": 1.4062, "step": 12649 }, { "epoch": 0.35, "learning_rate": 1.5219215078811424e-05, "loss": 1.3081, "step": 12650 }, { "epoch": 0.35, "learning_rate": 1.5218460579493605e-05, "loss": 1.2468, "step": 12651 }, { "epoch": 0.35, "learning_rate": 1.5217706039349e-05, "loss": 1.4348, "step": 12652 }, { "epoch": 0.35, "learning_rate": 1.521695145838352e-05, "loss": 1.3296, "step": 12653 }, { "epoch": 0.35, "learning_rate": 1.521619683660306e-05, "loss": 1.2275, "step": 12654 }, { "epoch": 0.35, "learning_rate": 1.5215442174013536e-05, "loss": 1.7593, "step": 12655 }, { "epoch": 0.35, "learning_rate": 1.521468747062084e-05, "loss": 1.3733, "step": 12656 }, { "epoch": 0.35, "learning_rate": 1.521393272643088e-05, "loss": 1.2427, "step": 12657 }, { "epoch": 0.35, "learning_rate": 1.5213177941449564e-05, "loss": 1.4727, "step": 12658 }, { "epoch": 0.35, "learning_rate": 1.5212423115682798e-05, "loss": 1.4543, "step": 12659 }, { "epoch": 0.35, "learning_rate": 1.5211668249136477e-05, "loss": 1.3396, "step": 12660 }, { "epoch": 0.35, "learning_rate": 1.5210913341816521e-05, "loss": 1.3257, "step": 12661 }, { "epoch": 0.35, "learning_rate": 1.5210158393728826e-05, "loss": 1.3237, "step": 12662 }, { "epoch": 0.35, "learning_rate": 1.5209403404879305e-05, "loss": 1.3237, "step": 12663 }, { "epoch": 0.35, "learning_rate": 1.5208648375273858e-05, "loss": 1.291, "step": 12664 }, { "epoch": 0.35, "learning_rate": 1.5207893304918398e-05, "loss": 1.2356, "step": 12665 }, { "epoch": 0.35, "learning_rate": 1.5207138193818827e-05, "loss": 1.313, "step": 12666 }, { "epoch": 0.35, "learning_rate": 1.520638304198106e-05, "loss": 1.3635, "step": 12667 }, { "epoch": 0.35, "learning_rate": 1.5205627849410995e-05, "loss": 1.3716, "step": 12668 }, { "epoch": 0.35, "learning_rate": 1.520487261611455e-05, "loss": 1.4521, "step": 12669 }, { "epoch": 0.35, "learning_rate": 1.5204117342097626e-05, "loss": 1.3848, "step": 12670 }, { "epoch": 0.35, "learning_rate": 1.5203362027366137e-05, "loss": 1.3879, "step": 12671 }, { "epoch": 0.35, "learning_rate": 1.5202606671925988e-05, "loss": 1.2823, "step": 12672 }, { "epoch": 0.35, "learning_rate": 1.5201851275783094e-05, "loss": 1.207, "step": 12673 }, { "epoch": 0.35, "learning_rate": 1.5201095838943358e-05, "loss": 1.2844, "step": 12674 }, { "epoch": 0.35, "learning_rate": 1.5200340361412697e-05, "loss": 1.2549, "step": 12675 }, { "epoch": 0.35, "learning_rate": 1.5199584843197017e-05, "loss": 1.4153, "step": 12676 }, { "epoch": 0.35, "learning_rate": 1.519882928430223e-05, "loss": 1.3486, "step": 12677 }, { "epoch": 0.35, "learning_rate": 1.5198073684734245e-05, "loss": 1.3833, "step": 12678 }, { "epoch": 0.35, "learning_rate": 1.5197318044498981e-05, "loss": 1.1909, "step": 12679 }, { "epoch": 0.35, "learning_rate": 1.519656236360234e-05, "loss": 1.2493, "step": 12680 }, { "epoch": 0.35, "learning_rate": 1.5195806642050243e-05, "loss": 1.3101, "step": 12681 }, { "epoch": 0.35, "learning_rate": 1.5195050879848596e-05, "loss": 1.3582, "step": 12682 }, { "epoch": 0.35, "learning_rate": 1.5194295077003314e-05, "loss": 1.2554, "step": 12683 }, { "epoch": 0.35, "learning_rate": 1.5193539233520307e-05, "loss": 1.2478, "step": 12684 }, { "epoch": 0.35, "learning_rate": 1.5192783349405495e-05, "loss": 1.3721, "step": 12685 }, { "epoch": 0.35, "learning_rate": 1.5192027424664786e-05, "loss": 1.3308, "step": 12686 }, { "epoch": 0.35, "learning_rate": 1.5191271459304097e-05, "loss": 1.2563, "step": 12687 }, { "epoch": 0.35, "learning_rate": 1.5190515453329342e-05, "loss": 1.1799, "step": 12688 }, { "epoch": 0.35, "learning_rate": 1.5189759406746434e-05, "loss": 1.2981, "step": 12689 }, { "epoch": 0.35, "learning_rate": 1.5189003319561289e-05, "loss": 1.3757, "step": 12690 }, { "epoch": 0.35, "learning_rate": 1.5188247191779821e-05, "loss": 1.6714, "step": 12691 }, { "epoch": 0.35, "learning_rate": 1.5187491023407945e-05, "loss": 1.3318, "step": 12692 }, { "epoch": 0.35, "learning_rate": 1.518673481445158e-05, "loss": 1.3445, "step": 12693 }, { "epoch": 0.35, "learning_rate": 1.5185978564916642e-05, "loss": 1.4141, "step": 12694 }, { "epoch": 0.35, "learning_rate": 1.5185222274809047e-05, "loss": 1.2898, "step": 12695 }, { "epoch": 0.35, "learning_rate": 1.518446594413471e-05, "loss": 1.4937, "step": 12696 }, { "epoch": 0.35, "learning_rate": 1.5183709572899548e-05, "loss": 1.6758, "step": 12697 }, { "epoch": 0.35, "learning_rate": 1.5182953161109483e-05, "loss": 1.3228, "step": 12698 }, { "epoch": 0.35, "learning_rate": 1.5182196708770427e-05, "loss": 1.4019, "step": 12699 }, { "epoch": 0.35, "learning_rate": 1.5181440215888303e-05, "loss": 1.2285, "step": 12700 }, { "epoch": 0.35, "learning_rate": 1.5180683682469023e-05, "loss": 1.498, "step": 12701 }, { "epoch": 0.35, "learning_rate": 1.5179927108518514e-05, "loss": 1.3926, "step": 12702 }, { "epoch": 0.35, "learning_rate": 1.517917049404269e-05, "loss": 1.0964, "step": 12703 }, { "epoch": 0.35, "learning_rate": 1.5178413839047472e-05, "loss": 1.313, "step": 12704 }, { "epoch": 0.35, "learning_rate": 1.5177657143538777e-05, "loss": 1.4182, "step": 12705 }, { "epoch": 0.35, "learning_rate": 1.517690040752253e-05, "loss": 1.3057, "step": 12706 }, { "epoch": 0.35, "learning_rate": 1.5176143631004647e-05, "loss": 1.3401, "step": 12707 }, { "epoch": 0.35, "learning_rate": 1.5175386813991053e-05, "loss": 1.2419, "step": 12708 }, { "epoch": 0.35, "learning_rate": 1.5174629956487659e-05, "loss": 1.3564, "step": 12709 }, { "epoch": 0.35, "learning_rate": 1.5173873058500398e-05, "loss": 1.3096, "step": 12710 }, { "epoch": 0.35, "learning_rate": 1.517311612003519e-05, "loss": 1.2698, "step": 12711 }, { "epoch": 0.35, "learning_rate": 1.517235914109795e-05, "loss": 1.2749, "step": 12712 }, { "epoch": 0.35, "learning_rate": 1.5171602121694607e-05, "loss": 1.3799, "step": 12713 }, { "epoch": 0.35, "learning_rate": 1.5170845061831081e-05, "loss": 1.2959, "step": 12714 }, { "epoch": 0.35, "learning_rate": 1.517008796151329e-05, "loss": 1.4429, "step": 12715 }, { "epoch": 0.35, "learning_rate": 1.5169330820747168e-05, "loss": 1.2861, "step": 12716 }, { "epoch": 0.35, "learning_rate": 1.5168573639538629e-05, "loss": 1.3567, "step": 12717 }, { "epoch": 0.35, "learning_rate": 1.5167816417893602e-05, "loss": 1.3008, "step": 12718 }, { "epoch": 0.35, "learning_rate": 1.5167059155818006e-05, "loss": 1.2898, "step": 12719 }, { "epoch": 0.35, "learning_rate": 1.5166301853317773e-05, "loss": 1.3318, "step": 12720 }, { "epoch": 0.35, "learning_rate": 1.5165544510398823e-05, "loss": 1.3608, "step": 12721 }, { "epoch": 0.35, "learning_rate": 1.516478712706708e-05, "loss": 1.2036, "step": 12722 }, { "epoch": 0.35, "learning_rate": 1.5164029703328472e-05, "loss": 1.6528, "step": 12723 }, { "epoch": 0.35, "learning_rate": 1.5163272239188922e-05, "loss": 1.3442, "step": 12724 }, { "epoch": 0.35, "learning_rate": 1.516251473465436e-05, "loss": 1.2834, "step": 12725 }, { "epoch": 0.35, "learning_rate": 1.516175718973071e-05, "loss": 1.3418, "step": 12726 }, { "epoch": 0.35, "learning_rate": 1.5160999604423899e-05, "loss": 1.2378, "step": 12727 }, { "epoch": 0.35, "learning_rate": 1.5160241978739853e-05, "loss": 1.3911, "step": 12728 }, { "epoch": 0.35, "learning_rate": 1.5159484312684502e-05, "loss": 1.2341, "step": 12729 }, { "epoch": 0.35, "learning_rate": 1.5158726606263772e-05, "loss": 1.2759, "step": 12730 }, { "epoch": 0.35, "learning_rate": 1.5157968859483587e-05, "loss": 1.1528, "step": 12731 }, { "epoch": 0.35, "learning_rate": 1.5157211072349885e-05, "loss": 1.3845, "step": 12732 }, { "epoch": 0.35, "learning_rate": 1.5156453244868585e-05, "loss": 1.2285, "step": 12733 }, { "epoch": 0.35, "learning_rate": 1.5155695377045621e-05, "loss": 1.4194, "step": 12734 }, { "epoch": 0.35, "learning_rate": 1.5154937468886918e-05, "loss": 1.2253, "step": 12735 }, { "epoch": 0.35, "learning_rate": 1.515417952039841e-05, "loss": 1.3899, "step": 12736 }, { "epoch": 0.35, "learning_rate": 1.5153421531586028e-05, "loss": 1.3359, "step": 12737 }, { "epoch": 0.35, "learning_rate": 1.5152663502455696e-05, "loss": 1.3865, "step": 12738 }, { "epoch": 0.35, "learning_rate": 1.5151905433013348e-05, "loss": 1.7295, "step": 12739 }, { "epoch": 0.35, "learning_rate": 1.5151147323264915e-05, "loss": 1.3691, "step": 12740 }, { "epoch": 0.35, "learning_rate": 1.5150389173216327e-05, "loss": 1.2617, "step": 12741 }, { "epoch": 0.35, "learning_rate": 1.5149630982873515e-05, "loss": 1.4026, "step": 12742 }, { "epoch": 0.35, "learning_rate": 1.5148872752242417e-05, "loss": 1.386, "step": 12743 }, { "epoch": 0.35, "learning_rate": 1.5148114481328952e-05, "loss": 1.2585, "step": 12744 }, { "epoch": 0.35, "learning_rate": 1.5147356170139068e-05, "loss": 1.2812, "step": 12745 }, { "epoch": 0.35, "learning_rate": 1.5146597818678684e-05, "loss": 1.2524, "step": 12746 }, { "epoch": 0.35, "learning_rate": 1.5145839426953742e-05, "loss": 1.4341, "step": 12747 }, { "epoch": 0.35, "learning_rate": 1.5145080994970169e-05, "loss": 1.3979, "step": 12748 }, { "epoch": 0.35, "learning_rate": 1.5144322522733905e-05, "loss": 1.3345, "step": 12749 }, { "epoch": 0.35, "learning_rate": 1.5143564010250877e-05, "loss": 1.3308, "step": 12750 }, { "epoch": 0.35, "learning_rate": 1.5142805457527025e-05, "loss": 1.3821, "step": 12751 }, { "epoch": 0.35, "learning_rate": 1.5142046864568284e-05, "loss": 1.3298, "step": 12752 }, { "epoch": 0.35, "learning_rate": 1.5141288231380579e-05, "loss": 1.3318, "step": 12753 }, { "epoch": 0.35, "learning_rate": 1.5140529557969858e-05, "loss": 1.3979, "step": 12754 }, { "epoch": 0.35, "learning_rate": 1.513977084434205e-05, "loss": 1.301, "step": 12755 }, { "epoch": 0.35, "learning_rate": 1.5139012090503092e-05, "loss": 1.2434, "step": 12756 }, { "epoch": 0.35, "learning_rate": 1.513825329645892e-05, "loss": 1.3833, "step": 12757 }, { "epoch": 0.35, "learning_rate": 1.5137494462215468e-05, "loss": 1.324, "step": 12758 }, { "epoch": 0.35, "learning_rate": 1.5136735587778679e-05, "loss": 1.3208, "step": 12759 }, { "epoch": 0.35, "learning_rate": 1.5135976673154484e-05, "loss": 1.2751, "step": 12760 }, { "epoch": 0.35, "learning_rate": 1.5135217718348822e-05, "loss": 1.3718, "step": 12761 }, { "epoch": 0.35, "learning_rate": 1.5134458723367633e-05, "loss": 1.4331, "step": 12762 }, { "epoch": 0.35, "learning_rate": 1.5133699688216854e-05, "loss": 1.2832, "step": 12763 }, { "epoch": 0.35, "learning_rate": 1.513294061290242e-05, "loss": 1.2886, "step": 12764 }, { "epoch": 0.35, "learning_rate": 1.5132181497430276e-05, "loss": 1.4429, "step": 12765 }, { "epoch": 0.35, "learning_rate": 1.5131422341806352e-05, "loss": 1.4043, "step": 12766 }, { "epoch": 0.35, "learning_rate": 1.51306631460366e-05, "loss": 1.384, "step": 12767 }, { "epoch": 0.35, "learning_rate": 1.5129903910126946e-05, "loss": 1.2693, "step": 12768 }, { "epoch": 0.35, "learning_rate": 1.512914463408334e-05, "loss": 1.2297, "step": 12769 }, { "epoch": 0.35, "learning_rate": 1.5128385317911714e-05, "loss": 1.7461, "step": 12770 }, { "epoch": 0.35, "learning_rate": 1.5127625961618013e-05, "loss": 1.2615, "step": 12771 }, { "epoch": 0.35, "learning_rate": 1.5126866565208178e-05, "loss": 1.3242, "step": 12772 }, { "epoch": 0.35, "learning_rate": 1.5126107128688152e-05, "loss": 1.3113, "step": 12773 }, { "epoch": 0.35, "learning_rate": 1.5125347652063873e-05, "loss": 1.231, "step": 12774 }, { "epoch": 0.35, "learning_rate": 1.5124588135341287e-05, "loss": 1.2573, "step": 12775 }, { "epoch": 0.35, "learning_rate": 1.512382857852633e-05, "loss": 1.3081, "step": 12776 }, { "epoch": 0.35, "learning_rate": 1.512306898162495e-05, "loss": 1.2151, "step": 12777 }, { "epoch": 0.35, "learning_rate": 1.5122309344643085e-05, "loss": 1.7715, "step": 12778 }, { "epoch": 0.35, "learning_rate": 1.5121549667586681e-05, "loss": 1.3979, "step": 12779 }, { "epoch": 0.35, "learning_rate": 1.512078995046168e-05, "loss": 1.2368, "step": 12780 }, { "epoch": 0.35, "learning_rate": 1.512003019327403e-05, "loss": 1.2363, "step": 12781 }, { "epoch": 0.35, "learning_rate": 1.5119270396029666e-05, "loss": 1.3782, "step": 12782 }, { "epoch": 0.35, "learning_rate": 1.511851055873454e-05, "loss": 1.2209, "step": 12783 }, { "epoch": 0.35, "learning_rate": 1.5117750681394597e-05, "loss": 1.1968, "step": 12784 }, { "epoch": 0.35, "learning_rate": 1.5116990764015777e-05, "loss": 1.3511, "step": 12785 }, { "epoch": 0.35, "learning_rate": 1.5116230806604024e-05, "loss": 1.3347, "step": 12786 }, { "epoch": 0.35, "learning_rate": 1.5115470809165292e-05, "loss": 1.3992, "step": 12787 }, { "epoch": 0.35, "learning_rate": 1.5114710771705518e-05, "loss": 1.3398, "step": 12788 }, { "epoch": 0.35, "learning_rate": 1.5113950694230654e-05, "loss": 1.3552, "step": 12789 }, { "epoch": 0.35, "learning_rate": 1.5113190576746645e-05, "loss": 1.3564, "step": 12790 }, { "epoch": 0.35, "learning_rate": 1.5112430419259438e-05, "loss": 1.2395, "step": 12791 }, { "epoch": 0.35, "learning_rate": 1.5111670221774977e-05, "loss": 1.4438, "step": 12792 }, { "epoch": 0.35, "learning_rate": 1.5110909984299216e-05, "loss": 1.3667, "step": 12793 }, { "epoch": 0.35, "learning_rate": 1.5110149706838093e-05, "loss": 1.2317, "step": 12794 }, { "epoch": 0.35, "learning_rate": 1.5109389389397566e-05, "loss": 1.1897, "step": 12795 }, { "epoch": 0.35, "learning_rate": 1.5108629031983577e-05, "loss": 1.373, "step": 12796 }, { "epoch": 0.35, "learning_rate": 1.5107868634602079e-05, "loss": 1.3538, "step": 12797 }, { "epoch": 0.35, "learning_rate": 1.5107108197259015e-05, "loss": 1.0709, "step": 12798 }, { "epoch": 0.35, "learning_rate": 1.5106347719960341e-05, "loss": 1.3782, "step": 12799 }, { "epoch": 0.35, "learning_rate": 1.5105587202712002e-05, "loss": 1.385, "step": 12800 }, { "epoch": 0.35, "learning_rate": 1.5104826645519953e-05, "loss": 1.3088, "step": 12801 }, { "epoch": 0.35, "learning_rate": 1.5104066048390135e-05, "loss": 1.2017, "step": 12802 }, { "epoch": 0.35, "learning_rate": 1.5103305411328508e-05, "loss": 1.1743, "step": 12803 }, { "epoch": 0.35, "learning_rate": 1.5102544734341018e-05, "loss": 1.3623, "step": 12804 }, { "epoch": 0.35, "learning_rate": 1.5101784017433616e-05, "loss": 1.3223, "step": 12805 }, { "epoch": 0.35, "learning_rate": 1.5101023260612259e-05, "loss": 1.2524, "step": 12806 }, { "epoch": 0.35, "learning_rate": 1.5100262463882894e-05, "loss": 1.251, "step": 12807 }, { "epoch": 0.35, "learning_rate": 1.5099501627251471e-05, "loss": 1.377, "step": 12808 }, { "epoch": 0.35, "learning_rate": 1.5098740750723945e-05, "loss": 1.4077, "step": 12809 }, { "epoch": 0.35, "learning_rate": 1.5097979834306271e-05, "loss": 1.2778, "step": 12810 }, { "epoch": 0.35, "learning_rate": 1.5097218878004398e-05, "loss": 1.4473, "step": 12811 }, { "epoch": 0.35, "learning_rate": 1.5096457881824284e-05, "loss": 1.3557, "step": 12812 }, { "epoch": 0.35, "learning_rate": 1.5095696845771879e-05, "loss": 1.3167, "step": 12813 }, { "epoch": 0.35, "learning_rate": 1.5094935769853139e-05, "loss": 1.2605, "step": 12814 }, { "epoch": 0.35, "learning_rate": 1.5094174654074016e-05, "loss": 1.4409, "step": 12815 }, { "epoch": 0.35, "learning_rate": 1.5093413498440465e-05, "loss": 1.2917, "step": 12816 }, { "epoch": 0.35, "learning_rate": 1.5092652302958441e-05, "loss": 1.2395, "step": 12817 }, { "epoch": 0.35, "learning_rate": 1.5091891067633904e-05, "loss": 1.3682, "step": 12818 }, { "epoch": 0.35, "learning_rate": 1.5091129792472804e-05, "loss": 1.1475, "step": 12819 }, { "epoch": 0.35, "learning_rate": 1.5090368477481096e-05, "loss": 1.2634, "step": 12820 }, { "epoch": 0.35, "learning_rate": 1.5089607122664743e-05, "loss": 1.2566, "step": 12821 }, { "epoch": 0.35, "learning_rate": 1.5088845728029695e-05, "loss": 1.3086, "step": 12822 }, { "epoch": 0.35, "learning_rate": 1.5088084293581911e-05, "loss": 1.3513, "step": 12823 }, { "epoch": 0.35, "learning_rate": 1.5087322819327349e-05, "loss": 1.3333, "step": 12824 }, { "epoch": 0.35, "learning_rate": 1.5086561305271966e-05, "loss": 1.709, "step": 12825 }, { "epoch": 0.35, "learning_rate": 1.5085799751421717e-05, "loss": 1.833, "step": 12826 }, { "epoch": 0.35, "learning_rate": 1.5085038157782563e-05, "loss": 1.3503, "step": 12827 }, { "epoch": 0.35, "learning_rate": 1.5084276524360462e-05, "loss": 1.3618, "step": 12828 }, { "epoch": 0.35, "learning_rate": 1.508351485116137e-05, "loss": 1.3616, "step": 12829 }, { "epoch": 0.35, "learning_rate": 1.5082753138191252e-05, "loss": 1.373, "step": 12830 }, { "epoch": 0.35, "learning_rate": 1.508199138545606e-05, "loss": 1.2156, "step": 12831 }, { "epoch": 0.35, "learning_rate": 1.5081229592961762e-05, "loss": 1.3274, "step": 12832 }, { "epoch": 0.35, "learning_rate": 1.5080467760714305e-05, "loss": 1.4937, "step": 12833 }, { "epoch": 0.35, "learning_rate": 1.5079705888719665e-05, "loss": 1.3945, "step": 12834 }, { "epoch": 0.35, "learning_rate": 1.5078943976983792e-05, "loss": 1.335, "step": 12835 }, { "epoch": 0.35, "learning_rate": 1.5078182025512649e-05, "loss": 1.4297, "step": 12836 }, { "epoch": 0.35, "learning_rate": 1.5077420034312197e-05, "loss": 1.3889, "step": 12837 }, { "epoch": 0.35, "learning_rate": 1.50766580033884e-05, "loss": 1.249, "step": 12838 }, { "epoch": 0.35, "learning_rate": 1.5075895932747217e-05, "loss": 1.478, "step": 12839 }, { "epoch": 0.35, "learning_rate": 1.5075133822394615e-05, "loss": 1.429, "step": 12840 }, { "epoch": 0.35, "learning_rate": 1.5074371672336545e-05, "loss": 1.6812, "step": 12841 }, { "epoch": 0.35, "learning_rate": 1.5073609482578984e-05, "loss": 1.3823, "step": 12842 }, { "epoch": 0.35, "learning_rate": 1.5072847253127884e-05, "loss": 1.312, "step": 12843 }, { "epoch": 0.35, "learning_rate": 1.5072084983989217e-05, "loss": 1.1855, "step": 12844 }, { "epoch": 0.35, "learning_rate": 1.5071322675168935e-05, "loss": 1.291, "step": 12845 }, { "epoch": 0.35, "learning_rate": 1.5070560326673016e-05, "loss": 1.3105, "step": 12846 }, { "epoch": 0.35, "learning_rate": 1.5069797938507413e-05, "loss": 1.3396, "step": 12847 }, { "epoch": 0.35, "learning_rate": 1.5069035510678097e-05, "loss": 1.5278, "step": 12848 }, { "epoch": 0.35, "learning_rate": 1.506827304319103e-05, "loss": 1.4241, "step": 12849 }, { "epoch": 0.35, "learning_rate": 1.5067510536052177e-05, "loss": 1.3264, "step": 12850 }, { "epoch": 0.35, "learning_rate": 1.5066747989267509e-05, "loss": 1.353, "step": 12851 }, { "epoch": 0.35, "learning_rate": 1.5065985402842981e-05, "loss": 1.2954, "step": 12852 }, { "epoch": 0.35, "learning_rate": 1.5065222776784571e-05, "loss": 1.332, "step": 12853 }, { "epoch": 0.35, "learning_rate": 1.5064460111098236e-05, "loss": 1.3501, "step": 12854 }, { "epoch": 0.35, "learning_rate": 1.506369740578995e-05, "loss": 1.3157, "step": 12855 }, { "epoch": 0.35, "learning_rate": 1.5062934660865672e-05, "loss": 1.4165, "step": 12856 }, { "epoch": 0.35, "learning_rate": 1.5062171876331377e-05, "loss": 1.3767, "step": 12857 }, { "epoch": 0.35, "learning_rate": 1.5061409052193031e-05, "loss": 1.4326, "step": 12858 }, { "epoch": 0.35, "learning_rate": 1.5060646188456598e-05, "loss": 1.7378, "step": 12859 }, { "epoch": 0.35, "learning_rate": 1.505988328512805e-05, "loss": 1.4187, "step": 12860 }, { "epoch": 0.35, "learning_rate": 1.5059120342213353e-05, "loss": 1.4741, "step": 12861 }, { "epoch": 0.35, "learning_rate": 1.5058357359718478e-05, "loss": 1.2898, "step": 12862 }, { "epoch": 0.35, "learning_rate": 1.5057594337649394e-05, "loss": 1.3806, "step": 12863 }, { "epoch": 0.35, "learning_rate": 1.505683127601207e-05, "loss": 1.2786, "step": 12864 }, { "epoch": 0.35, "learning_rate": 1.5056068174812475e-05, "loss": 1.2314, "step": 12865 }, { "epoch": 0.35, "learning_rate": 1.5055305034056583e-05, "loss": 1.4612, "step": 12866 }, { "epoch": 0.35, "learning_rate": 1.5054541853750359e-05, "loss": 1.3977, "step": 12867 }, { "epoch": 0.35, "learning_rate": 1.5053778633899776e-05, "loss": 1.2705, "step": 12868 }, { "epoch": 0.35, "learning_rate": 1.5053015374510809e-05, "loss": 1.1721, "step": 12869 }, { "epoch": 0.35, "learning_rate": 1.5052252075589422e-05, "loss": 1.23, "step": 12870 }, { "epoch": 0.35, "learning_rate": 1.5051488737141593e-05, "loss": 1.2842, "step": 12871 }, { "epoch": 0.35, "learning_rate": 1.5050725359173291e-05, "loss": 1.2568, "step": 12872 }, { "epoch": 0.35, "learning_rate": 1.5049961941690487e-05, "loss": 1.2798, "step": 12873 }, { "epoch": 0.35, "learning_rate": 1.5049198484699159e-05, "loss": 1.3145, "step": 12874 }, { "epoch": 0.35, "learning_rate": 1.5048434988205273e-05, "loss": 1.4634, "step": 12875 }, { "epoch": 0.35, "learning_rate": 1.5047671452214804e-05, "loss": 1.2366, "step": 12876 }, { "epoch": 0.35, "learning_rate": 1.5046907876733735e-05, "loss": 1.3193, "step": 12877 }, { "epoch": 0.35, "learning_rate": 1.5046144261768026e-05, "loss": 1.3335, "step": 12878 }, { "epoch": 0.35, "learning_rate": 1.5045380607323657e-05, "loss": 1.1068, "step": 12879 }, { "epoch": 0.35, "learning_rate": 1.50446169134066e-05, "loss": 1.2893, "step": 12880 }, { "epoch": 0.35, "learning_rate": 1.5043853180022838e-05, "loss": 1.2896, "step": 12881 }, { "epoch": 0.35, "learning_rate": 1.5043089407178338e-05, "loss": 1.3672, "step": 12882 }, { "epoch": 0.35, "learning_rate": 1.5042325594879079e-05, "loss": 1.3582, "step": 12883 }, { "epoch": 0.35, "learning_rate": 1.5041561743131034e-05, "loss": 1.2434, "step": 12884 }, { "epoch": 0.35, "learning_rate": 1.5040797851940184e-05, "loss": 1.4102, "step": 12885 }, { "epoch": 0.35, "learning_rate": 1.5040033921312497e-05, "loss": 1.271, "step": 12886 }, { "epoch": 0.35, "learning_rate": 1.5039269951253958e-05, "loss": 1.3386, "step": 12887 }, { "epoch": 0.35, "learning_rate": 1.503850594177054e-05, "loss": 1.395, "step": 12888 }, { "epoch": 0.35, "learning_rate": 1.5037741892868223e-05, "loss": 1.2495, "step": 12889 }, { "epoch": 0.35, "learning_rate": 1.5036977804552977e-05, "loss": 1.2947, "step": 12890 }, { "epoch": 0.35, "learning_rate": 1.5036213676830791e-05, "loss": 1.4546, "step": 12891 }, { "epoch": 0.35, "learning_rate": 1.5035449509707633e-05, "loss": 1.3269, "step": 12892 }, { "epoch": 0.35, "learning_rate": 1.5034685303189486e-05, "loss": 1.3074, "step": 12893 }, { "epoch": 0.35, "learning_rate": 1.5033921057282332e-05, "loss": 1.3484, "step": 12894 }, { "epoch": 0.35, "learning_rate": 1.5033156771992144e-05, "loss": 1.4165, "step": 12895 }, { "epoch": 0.35, "learning_rate": 1.5032392447324906e-05, "loss": 1.1831, "step": 12896 }, { "epoch": 0.35, "learning_rate": 1.5031628083286593e-05, "loss": 1.2666, "step": 12897 }, { "epoch": 0.35, "learning_rate": 1.5030863679883192e-05, "loss": 1.3608, "step": 12898 }, { "epoch": 0.35, "learning_rate": 1.5030099237120674e-05, "loss": 1.4272, "step": 12899 }, { "epoch": 0.35, "learning_rate": 1.5029334755005027e-05, "loss": 1.1628, "step": 12900 }, { "epoch": 0.35, "learning_rate": 1.5028570233542232e-05, "loss": 0.9785, "step": 12901 }, { "epoch": 0.35, "learning_rate": 1.5027805672738267e-05, "loss": 1.2798, "step": 12902 }, { "epoch": 0.35, "learning_rate": 1.5027041072599115e-05, "loss": 1.2954, "step": 12903 }, { "epoch": 0.35, "learning_rate": 1.5026276433130758e-05, "loss": 1.324, "step": 12904 }, { "epoch": 0.35, "learning_rate": 1.5025511754339178e-05, "loss": 1.3684, "step": 12905 }, { "epoch": 0.35, "learning_rate": 1.5024747036230354e-05, "loss": 1.3716, "step": 12906 }, { "epoch": 0.35, "learning_rate": 1.5023982278810274e-05, "loss": 1.4089, "step": 12907 }, { "epoch": 0.35, "learning_rate": 1.502321748208492e-05, "loss": 1.2971, "step": 12908 }, { "epoch": 0.35, "learning_rate": 1.5022452646060273e-05, "loss": 1.4392, "step": 12909 }, { "epoch": 0.35, "learning_rate": 1.502168777074232e-05, "loss": 1.2913, "step": 12910 }, { "epoch": 0.35, "learning_rate": 1.502092285613704e-05, "loss": 1.4888, "step": 12911 }, { "epoch": 0.35, "learning_rate": 1.5020157902250423e-05, "loss": 1.3135, "step": 12912 }, { "epoch": 0.35, "learning_rate": 1.5019392909088448e-05, "loss": 1.2009, "step": 12913 }, { "epoch": 0.35, "learning_rate": 1.501862787665711e-05, "loss": 1.2827, "step": 12914 }, { "epoch": 0.35, "learning_rate": 1.501786280496238e-05, "loss": 1.1895, "step": 12915 }, { "epoch": 0.35, "learning_rate": 1.5017097694010256e-05, "loss": 1.3528, "step": 12916 }, { "epoch": 0.35, "learning_rate": 1.5016332543806717e-05, "loss": 1.1506, "step": 12917 }, { "epoch": 0.35, "learning_rate": 1.5015567354357752e-05, "loss": 1.1868, "step": 12918 }, { "epoch": 0.35, "learning_rate": 1.5014802125669345e-05, "loss": 1.2737, "step": 12919 }, { "epoch": 0.35, "learning_rate": 1.5014036857747484e-05, "loss": 1.417, "step": 12920 }, { "epoch": 0.35, "learning_rate": 1.5013271550598158e-05, "loss": 1.2905, "step": 12921 }, { "epoch": 0.35, "learning_rate": 1.5012506204227352e-05, "loss": 1.3384, "step": 12922 }, { "epoch": 0.35, "learning_rate": 1.5011740818641057e-05, "loss": 1.2705, "step": 12923 }, { "epoch": 0.35, "learning_rate": 1.5010975393845257e-05, "loss": 1.7583, "step": 12924 }, { "epoch": 0.35, "learning_rate": 1.5010209929845938e-05, "loss": 1.7466, "step": 12925 }, { "epoch": 0.35, "learning_rate": 1.5009444426649096e-05, "loss": 1.4819, "step": 12926 }, { "epoch": 0.35, "learning_rate": 1.5008678884260715e-05, "loss": 1.342, "step": 12927 }, { "epoch": 0.35, "learning_rate": 1.5007913302686788e-05, "loss": 1.2664, "step": 12928 }, { "epoch": 0.35, "learning_rate": 1.5007147681933298e-05, "loss": 1.2959, "step": 12929 }, { "epoch": 0.35, "learning_rate": 1.5006382022006245e-05, "loss": 1.4219, "step": 12930 }, { "epoch": 0.35, "learning_rate": 1.5005616322911609e-05, "loss": 1.4314, "step": 12931 }, { "epoch": 0.35, "learning_rate": 1.5004850584655385e-05, "loss": 1.3389, "step": 12932 }, { "epoch": 0.35, "learning_rate": 1.5004084807243567e-05, "loss": 1.3076, "step": 12933 }, { "epoch": 0.35, "learning_rate": 1.5003318990682139e-05, "loss": 1.2607, "step": 12934 }, { "epoch": 0.35, "learning_rate": 1.5002553134977096e-05, "loss": 1.4321, "step": 12935 }, { "epoch": 0.35, "learning_rate": 1.500178724013443e-05, "loss": 1.2527, "step": 12936 }, { "epoch": 0.35, "learning_rate": 1.5001021306160133e-05, "loss": 1.2195, "step": 12937 }, { "epoch": 0.35, "learning_rate": 1.5000255333060198e-05, "loss": 1.3701, "step": 12938 }, { "epoch": 0.35, "learning_rate": 1.4999489320840614e-05, "loss": 1.731, "step": 12939 }, { "epoch": 0.35, "learning_rate": 1.499872326950738e-05, "loss": 1.2134, "step": 12940 }, { "epoch": 0.35, "learning_rate": 1.4997957179066482e-05, "loss": 1.4468, "step": 12941 }, { "epoch": 0.35, "learning_rate": 1.499719104952392e-05, "loss": 1.3606, "step": 12942 }, { "epoch": 0.35, "learning_rate": 1.4996424880885683e-05, "loss": 1.2871, "step": 12943 }, { "epoch": 0.35, "learning_rate": 1.4995658673157769e-05, "loss": 1.7754, "step": 12944 }, { "epoch": 0.35, "learning_rate": 1.4994892426346168e-05, "loss": 1.3604, "step": 12945 }, { "epoch": 0.35, "learning_rate": 1.4994126140456882e-05, "loss": 1.2517, "step": 12946 }, { "epoch": 0.35, "learning_rate": 1.4993359815495895e-05, "loss": 1.3447, "step": 12947 }, { "epoch": 0.35, "learning_rate": 1.4992593451469215e-05, "loss": 1.2168, "step": 12948 }, { "epoch": 0.35, "learning_rate": 1.499182704838283e-05, "loss": 1.3892, "step": 12949 }, { "epoch": 0.35, "learning_rate": 1.4991060606242738e-05, "loss": 1.3025, "step": 12950 }, { "epoch": 0.35, "learning_rate": 1.4990294125054931e-05, "loss": 1.3181, "step": 12951 }, { "epoch": 0.35, "learning_rate": 1.4989527604825414e-05, "loss": 1.1909, "step": 12952 }, { "epoch": 0.35, "learning_rate": 1.4988761045560176e-05, "loss": 1.394, "step": 12953 }, { "epoch": 0.35, "learning_rate": 1.4987994447265219e-05, "loss": 1.2932, "step": 12954 }, { "epoch": 0.35, "learning_rate": 1.4987227809946538e-05, "loss": 1.5581, "step": 12955 }, { "epoch": 0.35, "learning_rate": 1.4986461133610133e-05, "loss": 1.4795, "step": 12956 }, { "epoch": 0.35, "learning_rate": 1.4985694418262e-05, "loss": 1.4634, "step": 12957 }, { "epoch": 0.35, "learning_rate": 1.4984927663908137e-05, "loss": 1.3206, "step": 12958 }, { "epoch": 0.35, "learning_rate": 1.4984160870554548e-05, "loss": 1.3301, "step": 12959 }, { "epoch": 0.35, "learning_rate": 1.4983394038207223e-05, "loss": 1.3604, "step": 12960 }, { "epoch": 0.35, "learning_rate": 1.498262716687217e-05, "loss": 1.2764, "step": 12961 }, { "epoch": 0.35, "learning_rate": 1.4981860256555382e-05, "loss": 1.4214, "step": 12962 }, { "epoch": 0.35, "learning_rate": 1.4981093307262866e-05, "loss": 1.2024, "step": 12963 }, { "epoch": 0.35, "learning_rate": 1.4980326319000615e-05, "loss": 1.4399, "step": 12964 }, { "epoch": 0.35, "learning_rate": 1.4979559291774637e-05, "loss": 1.3813, "step": 12965 }, { "epoch": 0.35, "learning_rate": 1.4978792225590923e-05, "loss": 1.2639, "step": 12966 }, { "epoch": 0.35, "learning_rate": 1.4978025120455484e-05, "loss": 1.2476, "step": 12967 }, { "epoch": 0.35, "learning_rate": 1.4977257976374315e-05, "loss": 1.3533, "step": 12968 }, { "epoch": 0.35, "learning_rate": 1.4976490793353422e-05, "loss": 1.2832, "step": 12969 }, { "epoch": 0.35, "learning_rate": 1.4975723571398803e-05, "loss": 1.3994, "step": 12970 }, { "epoch": 0.35, "learning_rate": 1.4974956310516464e-05, "loss": 1.3289, "step": 12971 }, { "epoch": 0.35, "learning_rate": 1.4974189010712405e-05, "loss": 1.1807, "step": 12972 }, { "epoch": 0.35, "learning_rate": 1.4973421671992632e-05, "loss": 1.478, "step": 12973 }, { "epoch": 0.35, "learning_rate": 1.4972654294363142e-05, "loss": 1.1841, "step": 12974 }, { "epoch": 0.35, "learning_rate": 1.497188687782995e-05, "loss": 1.4102, "step": 12975 }, { "epoch": 0.35, "learning_rate": 1.4971119422399047e-05, "loss": 1.3442, "step": 12976 }, { "epoch": 0.35, "learning_rate": 1.4970351928076447e-05, "loss": 1.2944, "step": 12977 }, { "epoch": 0.35, "learning_rate": 1.4969584394868148e-05, "loss": 1.217, "step": 12978 }, { "epoch": 0.35, "learning_rate": 1.4968816822780161e-05, "loss": 1.2629, "step": 12979 }, { "epoch": 0.35, "learning_rate": 1.4968049211818487e-05, "loss": 1.1546, "step": 12980 }, { "epoch": 0.35, "learning_rate": 1.4967281561989131e-05, "loss": 1.3103, "step": 12981 }, { "epoch": 0.35, "learning_rate": 1.49665138732981e-05, "loss": 1.2795, "step": 12982 }, { "epoch": 0.35, "learning_rate": 1.4965746145751401e-05, "loss": 1.2969, "step": 12983 }, { "epoch": 0.35, "learning_rate": 1.4964978379355035e-05, "loss": 1.354, "step": 12984 }, { "epoch": 0.35, "learning_rate": 1.4964210574115017e-05, "loss": 1.3472, "step": 12985 }, { "epoch": 0.35, "learning_rate": 1.4963442730037348e-05, "loss": 1.3423, "step": 12986 }, { "epoch": 0.35, "learning_rate": 1.4962674847128037e-05, "loss": 1.4124, "step": 12987 }, { "epoch": 0.35, "learning_rate": 1.496190692539309e-05, "loss": 1.3948, "step": 12988 }, { "epoch": 0.35, "learning_rate": 1.496113896483852e-05, "loss": 1.0936, "step": 12989 }, { "epoch": 0.35, "learning_rate": 1.496037096547033e-05, "loss": 1.3091, "step": 12990 }, { "epoch": 0.35, "learning_rate": 1.4959602927294532e-05, "loss": 1.1455, "step": 12991 }, { "epoch": 0.35, "learning_rate": 1.495883485031713e-05, "loss": 1.3096, "step": 12992 }, { "epoch": 0.35, "learning_rate": 1.4958066734544136e-05, "loss": 1.3599, "step": 12993 }, { "epoch": 0.35, "learning_rate": 1.4957298579981561e-05, "loss": 1.4946, "step": 12994 }, { "epoch": 0.35, "learning_rate": 1.4956530386635413e-05, "loss": 1.3899, "step": 12995 }, { "epoch": 0.35, "learning_rate": 1.49557621545117e-05, "loss": 1.4146, "step": 12996 }, { "epoch": 0.35, "learning_rate": 1.4954993883616438e-05, "loss": 1.1873, "step": 12997 }, { "epoch": 0.35, "learning_rate": 1.4954225573955632e-05, "loss": 1.324, "step": 12998 }, { "epoch": 0.35, "learning_rate": 1.4953457225535295e-05, "loss": 1.241, "step": 12999 }, { "epoch": 0.36, "learning_rate": 1.4952688838361436e-05, "loss": 1.4121, "step": 13000 }, { "epoch": 0.36, "learning_rate": 1.495192041244007e-05, "loss": 1.2498, "step": 13001 }, { "epoch": 0.36, "learning_rate": 1.4951151947777207e-05, "loss": 1.137, "step": 13002 }, { "epoch": 0.36, "learning_rate": 1.4950383444378858e-05, "loss": 1.3101, "step": 13003 }, { "epoch": 0.36, "learning_rate": 1.494961490225104e-05, "loss": 1.342, "step": 13004 }, { "epoch": 0.36, "learning_rate": 1.494884632139976e-05, "loss": 1.3423, "step": 13005 }, { "epoch": 0.36, "learning_rate": 1.4948077701831035e-05, "loss": 1.29, "step": 13006 }, { "epoch": 0.36, "learning_rate": 1.4947309043550875e-05, "loss": 1.3921, "step": 13007 }, { "epoch": 0.36, "learning_rate": 1.4946540346565297e-05, "loss": 1.3948, "step": 13008 }, { "epoch": 0.36, "learning_rate": 1.4945771610880311e-05, "loss": 1.7422, "step": 13009 }, { "epoch": 0.36, "learning_rate": 1.4945002836501936e-05, "loss": 1.3682, "step": 13010 }, { "epoch": 0.36, "learning_rate": 1.4944234023436183e-05, "loss": 1.3484, "step": 13011 }, { "epoch": 0.36, "learning_rate": 1.4943465171689068e-05, "loss": 1.2168, "step": 13012 }, { "epoch": 0.36, "learning_rate": 1.4942696281266607e-05, "loss": 1.3557, "step": 13013 }, { "epoch": 0.36, "learning_rate": 1.4941927352174814e-05, "loss": 1.8247, "step": 13014 }, { "epoch": 0.36, "learning_rate": 1.4941158384419705e-05, "loss": 1.292, "step": 13015 }, { "epoch": 0.36, "learning_rate": 1.4940389378007296e-05, "loss": 1.3054, "step": 13016 }, { "epoch": 0.36, "learning_rate": 1.4939620332943605e-05, "loss": 1.3252, "step": 13017 }, { "epoch": 0.36, "learning_rate": 1.4938851249234645e-05, "loss": 1.6641, "step": 13018 }, { "epoch": 0.36, "learning_rate": 1.4938082126886438e-05, "loss": 1.2151, "step": 13019 }, { "epoch": 0.36, "learning_rate": 1.4937312965904995e-05, "loss": 1.2869, "step": 13020 }, { "epoch": 0.36, "learning_rate": 1.493654376629634e-05, "loss": 1.3577, "step": 13021 }, { "epoch": 0.36, "learning_rate": 1.4935774528066486e-05, "loss": 1.2122, "step": 13022 }, { "epoch": 0.36, "learning_rate": 1.4935005251221455e-05, "loss": 1.2949, "step": 13023 }, { "epoch": 0.36, "learning_rate": 1.4934235935767262e-05, "loss": 1.177, "step": 13024 }, { "epoch": 0.36, "learning_rate": 1.4933466581709928e-05, "loss": 1.3826, "step": 13025 }, { "epoch": 0.36, "learning_rate": 1.4932697189055474e-05, "loss": 1.4565, "step": 13026 }, { "epoch": 0.36, "learning_rate": 1.4931927757809912e-05, "loss": 1.3232, "step": 13027 }, { "epoch": 0.36, "learning_rate": 1.4931158287979268e-05, "loss": 1.4204, "step": 13028 }, { "epoch": 0.36, "learning_rate": 1.493038877956956e-05, "loss": 1.3433, "step": 13029 }, { "epoch": 0.36, "learning_rate": 1.4929619232586811e-05, "loss": 1.3267, "step": 13030 }, { "epoch": 0.36, "learning_rate": 1.4928849647037038e-05, "loss": 1.2188, "step": 13031 }, { "epoch": 0.36, "learning_rate": 1.4928080022926264e-05, "loss": 1.3162, "step": 13032 }, { "epoch": 0.36, "learning_rate": 1.4927310360260505e-05, "loss": 1.3516, "step": 13033 }, { "epoch": 0.36, "learning_rate": 1.492654065904579e-05, "loss": 1.3083, "step": 13034 }, { "epoch": 0.36, "learning_rate": 1.4925770919288134e-05, "loss": 1.3303, "step": 13035 }, { "epoch": 0.36, "learning_rate": 1.4925001140993569e-05, "loss": 1.3174, "step": 13036 }, { "epoch": 0.36, "learning_rate": 1.4924231324168106e-05, "loss": 1.1436, "step": 13037 }, { "epoch": 0.36, "learning_rate": 1.4923461468817775e-05, "loss": 1.2354, "step": 13038 }, { "epoch": 0.36, "learning_rate": 1.4922691574948596e-05, "loss": 1.3369, "step": 13039 }, { "epoch": 0.36, "learning_rate": 1.4921921642566593e-05, "loss": 1.4253, "step": 13040 }, { "epoch": 0.36, "learning_rate": 1.4921151671677789e-05, "loss": 1.1807, "step": 13041 }, { "epoch": 0.36, "learning_rate": 1.492038166228821e-05, "loss": 1.4197, "step": 13042 }, { "epoch": 0.36, "learning_rate": 1.4919611614403875e-05, "loss": 1.3569, "step": 13043 }, { "epoch": 0.36, "learning_rate": 1.4918841528030816e-05, "loss": 1.3137, "step": 13044 }, { "epoch": 0.36, "learning_rate": 1.4918071403175051e-05, "loss": 1.2373, "step": 13045 }, { "epoch": 0.36, "learning_rate": 1.4917301239842612e-05, "loss": 1.4048, "step": 13046 }, { "epoch": 0.36, "learning_rate": 1.4916531038039516e-05, "loss": 1.3032, "step": 13047 }, { "epoch": 0.36, "learning_rate": 1.4915760797771794e-05, "loss": 1.3445, "step": 13048 }, { "epoch": 0.36, "learning_rate": 1.491499051904547e-05, "loss": 1.8247, "step": 13049 }, { "epoch": 0.36, "learning_rate": 1.4914220201866574e-05, "loss": 1.4944, "step": 13050 }, { "epoch": 0.36, "learning_rate": 1.4913449846241128e-05, "loss": 1.4136, "step": 13051 }, { "epoch": 0.36, "learning_rate": 1.4912679452175166e-05, "loss": 1.2854, "step": 13052 }, { "epoch": 0.36, "learning_rate": 1.4911909019674703e-05, "loss": 1.3074, "step": 13053 }, { "epoch": 0.36, "learning_rate": 1.4911138548745778e-05, "loss": 1.3525, "step": 13054 }, { "epoch": 0.36, "learning_rate": 1.4910368039394411e-05, "loss": 1.3381, "step": 13055 }, { "epoch": 0.36, "learning_rate": 1.4909597491626637e-05, "loss": 1.2314, "step": 13056 }, { "epoch": 0.36, "learning_rate": 1.490882690544848e-05, "loss": 1.374, "step": 13057 }, { "epoch": 0.36, "learning_rate": 1.490805628086597e-05, "loss": 1.2402, "step": 13058 }, { "epoch": 0.36, "learning_rate": 1.4907285617885134e-05, "loss": 1.2456, "step": 13059 }, { "epoch": 0.36, "learning_rate": 1.4906514916512004e-05, "loss": 1.4048, "step": 13060 }, { "epoch": 0.36, "learning_rate": 1.4905744176752609e-05, "loss": 1.3796, "step": 13061 }, { "epoch": 0.36, "learning_rate": 1.4904973398612976e-05, "loss": 1.3088, "step": 13062 }, { "epoch": 0.36, "learning_rate": 1.4904202582099138e-05, "loss": 1.1758, "step": 13063 }, { "epoch": 0.36, "learning_rate": 1.4903431727217128e-05, "loss": 1.3623, "step": 13064 }, { "epoch": 0.36, "learning_rate": 1.490266083397297e-05, "loss": 1.302, "step": 13065 }, { "epoch": 0.36, "learning_rate": 1.4901889902372702e-05, "loss": 1.2571, "step": 13066 }, { "epoch": 0.36, "learning_rate": 1.4901118932422352e-05, "loss": 1.304, "step": 13067 }, { "epoch": 0.36, "learning_rate": 1.4900347924127952e-05, "loss": 1.196, "step": 13068 }, { "epoch": 0.36, "learning_rate": 1.4899576877495533e-05, "loss": 1.2161, "step": 13069 }, { "epoch": 0.36, "learning_rate": 1.4898805792531128e-05, "loss": 1.3669, "step": 13070 }, { "epoch": 0.36, "learning_rate": 1.4898034669240772e-05, "loss": 1.2368, "step": 13071 }, { "epoch": 0.36, "learning_rate": 1.4897263507630495e-05, "loss": 1.376, "step": 13072 }, { "epoch": 0.36, "learning_rate": 1.4896492307706335e-05, "loss": 1.4736, "step": 13073 }, { "epoch": 0.36, "learning_rate": 1.4895721069474314e-05, "loss": 1.2344, "step": 13074 }, { "epoch": 0.36, "learning_rate": 1.4894949792940479e-05, "loss": 1.3362, "step": 13075 }, { "epoch": 0.36, "learning_rate": 1.4894178478110856e-05, "loss": 1.3123, "step": 13076 }, { "epoch": 0.36, "learning_rate": 1.4893407124991486e-05, "loss": 1.323, "step": 13077 }, { "epoch": 0.36, "learning_rate": 1.4892635733588394e-05, "loss": 1.3359, "step": 13078 }, { "epoch": 0.36, "learning_rate": 1.4891864303907626e-05, "loss": 1.2739, "step": 13079 }, { "epoch": 0.36, "learning_rate": 1.4891092835955208e-05, "loss": 1.1863, "step": 13080 }, { "epoch": 0.36, "learning_rate": 1.4890321329737181e-05, "loss": 1.2559, "step": 13081 }, { "epoch": 0.36, "learning_rate": 1.4889549785259577e-05, "loss": 1.3765, "step": 13082 }, { "epoch": 0.36, "learning_rate": 1.488877820252844e-05, "loss": 1.3772, "step": 13083 }, { "epoch": 0.36, "learning_rate": 1.48880065815498e-05, "loss": 1.1826, "step": 13084 }, { "epoch": 0.36, "learning_rate": 1.4887234922329692e-05, "loss": 1.4236, "step": 13085 }, { "epoch": 0.36, "learning_rate": 1.4886463224874157e-05, "loss": 1.3992, "step": 13086 }, { "epoch": 0.36, "learning_rate": 1.4885691489189233e-05, "loss": 1.792, "step": 13087 }, { "epoch": 0.36, "learning_rate": 1.4884919715280954e-05, "loss": 1.3423, "step": 13088 }, { "epoch": 0.36, "learning_rate": 1.4884147903155364e-05, "loss": 1.2305, "step": 13089 }, { "epoch": 0.36, "learning_rate": 1.4883376052818494e-05, "loss": 1.4343, "step": 13090 }, { "epoch": 0.36, "learning_rate": 1.4882604164276388e-05, "loss": 1.2898, "step": 13091 }, { "epoch": 0.36, "learning_rate": 1.488183223753508e-05, "loss": 1.1724, "step": 13092 }, { "epoch": 0.36, "learning_rate": 1.4881060272600616e-05, "loss": 1.3494, "step": 13093 }, { "epoch": 0.36, "learning_rate": 1.488028826947903e-05, "loss": 1.4238, "step": 13094 }, { "epoch": 0.36, "learning_rate": 1.4879516228176365e-05, "loss": 1.4192, "step": 13095 }, { "epoch": 0.36, "learning_rate": 1.4878744148698656e-05, "loss": 1.2944, "step": 13096 }, { "epoch": 0.36, "learning_rate": 1.4877972031051949e-05, "loss": 1.3435, "step": 13097 }, { "epoch": 0.36, "learning_rate": 1.4877199875242281e-05, "loss": 1.2888, "step": 13098 }, { "epoch": 0.36, "learning_rate": 1.4876427681275699e-05, "loss": 1.4031, "step": 13099 }, { "epoch": 0.36, "learning_rate": 1.4875655449158235e-05, "loss": 1.384, "step": 13100 }, { "epoch": 0.36, "learning_rate": 1.4874883178895938e-05, "loss": 1.3735, "step": 13101 }, { "epoch": 0.36, "learning_rate": 1.4874110870494846e-05, "loss": 1.4731, "step": 13102 }, { "epoch": 0.36, "learning_rate": 1.4873338523961004e-05, "loss": 1.3123, "step": 13103 }, { "epoch": 0.36, "learning_rate": 1.4872566139300453e-05, "loss": 1.2461, "step": 13104 }, { "epoch": 0.36, "learning_rate": 1.4871793716519234e-05, "loss": 1.1941, "step": 13105 }, { "epoch": 0.36, "learning_rate": 1.4871021255623394e-05, "loss": 1.6084, "step": 13106 }, { "epoch": 0.36, "learning_rate": 1.4870248756618972e-05, "loss": 1.2871, "step": 13107 }, { "epoch": 0.36, "learning_rate": 1.4869476219512015e-05, "loss": 1.3247, "step": 13108 }, { "epoch": 0.36, "learning_rate": 1.4868703644308568e-05, "loss": 1.356, "step": 13109 }, { "epoch": 0.36, "learning_rate": 1.486793103101467e-05, "loss": 1.322, "step": 13110 }, { "epoch": 0.36, "learning_rate": 1.4867158379636371e-05, "loss": 1.343, "step": 13111 }, { "epoch": 0.36, "learning_rate": 1.4866385690179709e-05, "loss": 1.2754, "step": 13112 }, { "epoch": 0.36, "learning_rate": 1.4865612962650737e-05, "loss": 1.2871, "step": 13113 }, { "epoch": 0.36, "learning_rate": 1.48648401970555e-05, "loss": 1.3613, "step": 13114 }, { "epoch": 0.36, "learning_rate": 1.4864067393400036e-05, "loss": 1.4199, "step": 13115 }, { "epoch": 0.36, "learning_rate": 1.48632945516904e-05, "loss": 1.2927, "step": 13116 }, { "epoch": 0.36, "learning_rate": 1.486252167193263e-05, "loss": 1.1848, "step": 13117 }, { "epoch": 0.36, "learning_rate": 1.4861748754132781e-05, "loss": 1.2668, "step": 13118 }, { "epoch": 0.36, "learning_rate": 1.4860975798296893e-05, "loss": 1.2722, "step": 13119 }, { "epoch": 0.36, "learning_rate": 1.486020280443102e-05, "loss": 1.3376, "step": 13120 }, { "epoch": 0.36, "learning_rate": 1.48594297725412e-05, "loss": 1.2305, "step": 13121 }, { "epoch": 0.36, "learning_rate": 1.485865670263349e-05, "loss": 1.3704, "step": 13122 }, { "epoch": 0.36, "learning_rate": 1.4857883594713934e-05, "loss": 1.4705, "step": 13123 }, { "epoch": 0.36, "learning_rate": 1.4857110448788584e-05, "loss": 1.355, "step": 13124 }, { "epoch": 0.36, "learning_rate": 1.485633726486348e-05, "loss": 1.2615, "step": 13125 }, { "epoch": 0.36, "learning_rate": 1.4855564042944681e-05, "loss": 1.1787, "step": 13126 }, { "epoch": 0.36, "learning_rate": 1.485479078303823e-05, "loss": 1.4319, "step": 13127 }, { "epoch": 0.36, "learning_rate": 1.4854017485150181e-05, "loss": 1.2749, "step": 13128 }, { "epoch": 0.36, "learning_rate": 1.4853244149286578e-05, "loss": 1.3801, "step": 13129 }, { "epoch": 0.36, "learning_rate": 1.4852470775453478e-05, "loss": 1.4526, "step": 13130 }, { "epoch": 0.36, "learning_rate": 1.4851697363656927e-05, "loss": 1.2739, "step": 13131 }, { "epoch": 0.36, "learning_rate": 1.485092391390298e-05, "loss": 1.2878, "step": 13132 }, { "epoch": 0.36, "learning_rate": 1.4850150426197682e-05, "loss": 1.2983, "step": 13133 }, { "epoch": 0.36, "learning_rate": 1.484937690054709e-05, "loss": 1.3298, "step": 13134 }, { "epoch": 0.36, "learning_rate": 1.4848603336957252e-05, "loss": 1.2102, "step": 13135 }, { "epoch": 0.36, "learning_rate": 1.4847829735434225e-05, "loss": 1.1897, "step": 13136 }, { "epoch": 0.36, "learning_rate": 1.4847056095984054e-05, "loss": 1.4053, "step": 13137 }, { "epoch": 0.36, "learning_rate": 1.4846282418612796e-05, "loss": 1.3962, "step": 13138 }, { "epoch": 0.36, "learning_rate": 1.4845508703326504e-05, "loss": 1.3218, "step": 13139 }, { "epoch": 0.36, "learning_rate": 1.484473495013123e-05, "loss": 1.3062, "step": 13140 }, { "epoch": 0.36, "learning_rate": 1.4843961159033027e-05, "loss": 1.394, "step": 13141 }, { "epoch": 0.36, "learning_rate": 1.4843187330037951e-05, "loss": 1.3975, "step": 13142 }, { "epoch": 0.36, "learning_rate": 1.4842413463152052e-05, "loss": 1.3193, "step": 13143 }, { "epoch": 0.36, "learning_rate": 1.484163955838139e-05, "loss": 1.4019, "step": 13144 }, { "epoch": 0.36, "learning_rate": 1.4840865615732017e-05, "loss": 1.4951, "step": 13145 }, { "epoch": 0.36, "learning_rate": 1.4840091635209988e-05, "loss": 1.2769, "step": 13146 }, { "epoch": 0.36, "learning_rate": 1.4839317616821356e-05, "loss": 1.3518, "step": 13147 }, { "epoch": 0.36, "learning_rate": 1.4838543560572181e-05, "loss": 1.3269, "step": 13148 }, { "epoch": 0.36, "learning_rate": 1.4837769466468514e-05, "loss": 1.2695, "step": 13149 }, { "epoch": 0.36, "learning_rate": 1.4836995334516415e-05, "loss": 1.3535, "step": 13150 }, { "epoch": 0.36, "learning_rate": 1.4836221164721938e-05, "loss": 1.3323, "step": 13151 }, { "epoch": 0.36, "learning_rate": 1.4835446957091143e-05, "loss": 1.3169, "step": 13152 }, { "epoch": 0.36, "learning_rate": 1.4834672711630083e-05, "loss": 1.3887, "step": 13153 }, { "epoch": 0.36, "learning_rate": 1.4833898428344817e-05, "loss": 1.4624, "step": 13154 }, { "epoch": 0.36, "learning_rate": 1.4833124107241404e-05, "loss": 1.3123, "step": 13155 }, { "epoch": 0.36, "learning_rate": 1.4832349748325898e-05, "loss": 1.4609, "step": 13156 }, { "epoch": 0.36, "learning_rate": 1.4831575351604361e-05, "loss": 1.3975, "step": 13157 }, { "epoch": 0.36, "learning_rate": 1.4830800917082852e-05, "loss": 1.2639, "step": 13158 }, { "epoch": 0.36, "learning_rate": 1.4830026444767427e-05, "loss": 1.3396, "step": 13159 }, { "epoch": 0.36, "learning_rate": 1.4829251934664147e-05, "loss": 1.2825, "step": 13160 }, { "epoch": 0.36, "learning_rate": 1.482847738677907e-05, "loss": 1.3826, "step": 13161 }, { "epoch": 0.36, "learning_rate": 1.4827702801118258e-05, "loss": 1.3108, "step": 13162 }, { "epoch": 0.36, "learning_rate": 1.482692817768777e-05, "loss": 1.2808, "step": 13163 }, { "epoch": 0.36, "learning_rate": 1.4826153516493663e-05, "loss": 1.4048, "step": 13164 }, { "epoch": 0.36, "learning_rate": 1.4825378817541998e-05, "loss": 1.1992, "step": 13165 }, { "epoch": 0.36, "learning_rate": 1.4824604080838842e-05, "loss": 1.4121, "step": 13166 }, { "epoch": 0.36, "learning_rate": 1.4823829306390251e-05, "loss": 1.2483, "step": 13167 }, { "epoch": 0.36, "learning_rate": 1.482305449420229e-05, "loss": 1.2188, "step": 13168 }, { "epoch": 0.36, "learning_rate": 1.4822279644281017e-05, "loss": 1.3079, "step": 13169 }, { "epoch": 0.36, "learning_rate": 1.4821504756632497e-05, "loss": 1.4362, "step": 13170 }, { "epoch": 0.36, "learning_rate": 1.4820729831262791e-05, "loss": 1.363, "step": 13171 }, { "epoch": 0.36, "learning_rate": 1.4819954868177959e-05, "loss": 1.3184, "step": 13172 }, { "epoch": 0.36, "learning_rate": 1.4819179867384069e-05, "loss": 1.2976, "step": 13173 }, { "epoch": 0.36, "learning_rate": 1.481840482888718e-05, "loss": 1.4114, "step": 13174 }, { "epoch": 0.36, "learning_rate": 1.4817629752693358e-05, "loss": 1.4448, "step": 13175 }, { "epoch": 0.36, "learning_rate": 1.4816854638808667e-05, "loss": 1.3347, "step": 13176 }, { "epoch": 0.36, "learning_rate": 1.481607948723917e-05, "loss": 1.2915, "step": 13177 }, { "epoch": 0.36, "learning_rate": 1.481530429799093e-05, "loss": 1.283, "step": 13178 }, { "epoch": 0.36, "learning_rate": 1.4814529071070018e-05, "loss": 1.3921, "step": 13179 }, { "epoch": 0.36, "learning_rate": 1.4813753806482492e-05, "loss": 1.2429, "step": 13180 }, { "epoch": 0.36, "learning_rate": 1.481297850423442e-05, "loss": 1.2256, "step": 13181 }, { "epoch": 0.36, "learning_rate": 1.4812203164331866e-05, "loss": 1.3474, "step": 13182 }, { "epoch": 0.36, "learning_rate": 1.4811427786780899e-05, "loss": 1.2744, "step": 13183 }, { "epoch": 0.36, "learning_rate": 1.4810652371587581e-05, "loss": 1.4614, "step": 13184 }, { "epoch": 0.36, "learning_rate": 1.4809876918757984e-05, "loss": 1.1254, "step": 13185 }, { "epoch": 0.36, "learning_rate": 1.480910142829817e-05, "loss": 1.3457, "step": 13186 }, { "epoch": 0.36, "learning_rate": 1.4808325900214211e-05, "loss": 1.1934, "step": 13187 }, { "epoch": 0.36, "learning_rate": 1.4807550334512166e-05, "loss": 1.3206, "step": 13188 }, { "epoch": 0.36, "learning_rate": 1.4806774731198113e-05, "loss": 1.3652, "step": 13189 }, { "epoch": 0.36, "learning_rate": 1.4805999090278107e-05, "loss": 1.4299, "step": 13190 }, { "epoch": 0.36, "learning_rate": 1.4805223411758231e-05, "loss": 1.3342, "step": 13191 }, { "epoch": 0.36, "learning_rate": 1.4804447695644543e-05, "loss": 0.9937, "step": 13192 }, { "epoch": 0.36, "learning_rate": 1.480367194194312e-05, "loss": 1.4771, "step": 13193 }, { "epoch": 0.36, "learning_rate": 1.4802896150660022e-05, "loss": 1.2568, "step": 13194 }, { "epoch": 0.36, "learning_rate": 1.4802120321801328e-05, "loss": 1.291, "step": 13195 }, { "epoch": 0.36, "learning_rate": 1.4801344455373097e-05, "loss": 1.7974, "step": 13196 }, { "epoch": 0.36, "learning_rate": 1.4800568551381409e-05, "loss": 1.3911, "step": 13197 }, { "epoch": 0.36, "learning_rate": 1.4799792609832326e-05, "loss": 1.3481, "step": 13198 }, { "epoch": 0.36, "learning_rate": 1.4799016630731928e-05, "loss": 1.1414, "step": 13199 }, { "epoch": 0.36, "learning_rate": 1.4798240614086274e-05, "loss": 1.2864, "step": 13200 }, { "epoch": 0.36, "learning_rate": 1.4797464559901448e-05, "loss": 1.4172, "step": 13201 }, { "epoch": 0.36, "learning_rate": 1.4796688468183512e-05, "loss": 1.356, "step": 13202 }, { "epoch": 0.36, "learning_rate": 1.4795912338938543e-05, "loss": 1.2073, "step": 13203 }, { "epoch": 0.36, "learning_rate": 1.4795136172172608e-05, "loss": 1.2651, "step": 13204 }, { "epoch": 0.36, "learning_rate": 1.4794359967891782e-05, "loss": 1.3684, "step": 13205 }, { "epoch": 0.36, "learning_rate": 1.4793583726102138e-05, "loss": 1.3992, "step": 13206 }, { "epoch": 0.36, "learning_rate": 1.4792807446809754e-05, "loss": 1.1628, "step": 13207 }, { "epoch": 0.36, "learning_rate": 1.4792031130020694e-05, "loss": 1.4375, "step": 13208 }, { "epoch": 0.36, "learning_rate": 1.4791254775741038e-05, "loss": 1.4187, "step": 13209 }, { "epoch": 0.36, "learning_rate": 1.4790478383976857e-05, "loss": 1.373, "step": 13210 }, { "epoch": 0.36, "learning_rate": 1.4789701954734226e-05, "loss": 1.1943, "step": 13211 }, { "epoch": 0.36, "learning_rate": 1.4788925488019217e-05, "loss": 1.4602, "step": 13212 }, { "epoch": 0.36, "learning_rate": 1.4788148983837909e-05, "loss": 1.4189, "step": 13213 }, { "epoch": 0.36, "learning_rate": 1.4787372442196374e-05, "loss": 1.3372, "step": 13214 }, { "epoch": 0.36, "learning_rate": 1.478659586310069e-05, "loss": 1.1885, "step": 13215 }, { "epoch": 0.36, "learning_rate": 1.4785819246556929e-05, "loss": 1.355, "step": 13216 }, { "epoch": 0.36, "learning_rate": 1.478504259257117e-05, "loss": 1.4199, "step": 13217 }, { "epoch": 0.36, "learning_rate": 1.4784265901149487e-05, "loss": 1.3081, "step": 13218 }, { "epoch": 0.36, "learning_rate": 1.4783489172297958e-05, "loss": 1.2354, "step": 13219 }, { "epoch": 0.36, "learning_rate": 1.4782712406022658e-05, "loss": 1.4302, "step": 13220 }, { "epoch": 0.36, "learning_rate": 1.4781935602329664e-05, "loss": 1.2954, "step": 13221 }, { "epoch": 0.36, "learning_rate": 1.4781158761225056e-05, "loss": 1.3738, "step": 13222 }, { "epoch": 0.36, "learning_rate": 1.478038188271491e-05, "loss": 1.2925, "step": 13223 }, { "epoch": 0.36, "learning_rate": 1.4779604966805306e-05, "loss": 1.312, "step": 13224 }, { "epoch": 0.36, "learning_rate": 1.4778828013502318e-05, "loss": 1.1646, "step": 13225 }, { "epoch": 0.36, "learning_rate": 1.4778051022812028e-05, "loss": 1.1345, "step": 13226 }, { "epoch": 0.36, "learning_rate": 1.477727399474051e-05, "loss": 1.3853, "step": 13227 }, { "epoch": 0.36, "learning_rate": 1.477649692929385e-05, "loss": 1.4238, "step": 13228 }, { "epoch": 0.36, "learning_rate": 1.4775719826478123e-05, "loss": 1.3462, "step": 13229 }, { "epoch": 0.36, "learning_rate": 1.4774942686299412e-05, "loss": 1.3401, "step": 13230 }, { "epoch": 0.36, "learning_rate": 1.4774165508763791e-05, "loss": 1.3247, "step": 13231 }, { "epoch": 0.36, "learning_rate": 1.4773388293877348e-05, "loss": 1.2761, "step": 13232 }, { "epoch": 0.36, "learning_rate": 1.4772611041646157e-05, "loss": 1.3196, "step": 13233 }, { "epoch": 0.36, "learning_rate": 1.4771833752076303e-05, "loss": 1.2754, "step": 13234 }, { "epoch": 0.36, "learning_rate": 1.4771056425173864e-05, "loss": 1.3203, "step": 13235 }, { "epoch": 0.36, "learning_rate": 1.4770279060944923e-05, "loss": 1.1899, "step": 13236 }, { "epoch": 0.36, "learning_rate": 1.4769501659395562e-05, "loss": 1.1982, "step": 13237 }, { "epoch": 0.36, "learning_rate": 1.4768724220531865e-05, "loss": 1.2593, "step": 13238 }, { "epoch": 0.36, "learning_rate": 1.4767946744359908e-05, "loss": 1.7437, "step": 13239 }, { "epoch": 0.36, "learning_rate": 1.4767169230885782e-05, "loss": 1.4448, "step": 13240 }, { "epoch": 0.36, "learning_rate": 1.4766391680115564e-05, "loss": 1.2886, "step": 13241 }, { "epoch": 0.36, "learning_rate": 1.4765614092055339e-05, "loss": 1.2566, "step": 13242 }, { "epoch": 0.36, "learning_rate": 1.4764836466711188e-05, "loss": 1.2163, "step": 13243 }, { "epoch": 0.36, "learning_rate": 1.47640588040892e-05, "loss": 1.4275, "step": 13244 }, { "epoch": 0.36, "learning_rate": 1.4763281104195455e-05, "loss": 1.363, "step": 13245 }, { "epoch": 0.36, "learning_rate": 1.4762503367036038e-05, "loss": 1.3374, "step": 13246 }, { "epoch": 0.36, "learning_rate": 1.4761725592617035e-05, "loss": 1.2771, "step": 13247 }, { "epoch": 0.36, "learning_rate": 1.4760947780944533e-05, "loss": 1.4014, "step": 13248 }, { "epoch": 0.36, "learning_rate": 1.476016993202461e-05, "loss": 1.405, "step": 13249 }, { "epoch": 0.36, "learning_rate": 1.4759392045863357e-05, "loss": 1.2856, "step": 13250 }, { "epoch": 0.36, "learning_rate": 1.4758614122466857e-05, "loss": 1.2869, "step": 13251 }, { "epoch": 0.36, "learning_rate": 1.47578361618412e-05, "loss": 1.3015, "step": 13252 }, { "epoch": 0.36, "learning_rate": 1.4757058163992466e-05, "loss": 1.2698, "step": 13253 }, { "epoch": 0.36, "learning_rate": 1.4756280128926753e-05, "loss": 1.3298, "step": 13254 }, { "epoch": 0.36, "learning_rate": 1.4755502056650134e-05, "loss": 1.2883, "step": 13255 }, { "epoch": 0.36, "learning_rate": 1.4754723947168707e-05, "loss": 1.2324, "step": 13256 }, { "epoch": 0.36, "learning_rate": 1.4753945800488555e-05, "loss": 1.437, "step": 13257 }, { "epoch": 0.36, "learning_rate": 1.4753167616615768e-05, "loss": 1.4448, "step": 13258 }, { "epoch": 0.36, "learning_rate": 1.475238939555643e-05, "loss": 1.3105, "step": 13259 }, { "epoch": 0.36, "learning_rate": 1.4751611137316634e-05, "loss": 1.3237, "step": 13260 }, { "epoch": 0.36, "learning_rate": 1.4750832841902467e-05, "loss": 1.2722, "step": 13261 }, { "epoch": 0.36, "learning_rate": 1.4750054509320017e-05, "loss": 1.2417, "step": 13262 }, { "epoch": 0.36, "learning_rate": 1.4749276139575372e-05, "loss": 1.2148, "step": 13263 }, { "epoch": 0.36, "learning_rate": 1.4748497732674629e-05, "loss": 1.3496, "step": 13264 }, { "epoch": 0.36, "learning_rate": 1.4747719288623868e-05, "loss": 1.2876, "step": 13265 }, { "epoch": 0.36, "learning_rate": 1.4746940807429187e-05, "loss": 1.2107, "step": 13266 }, { "epoch": 0.36, "learning_rate": 1.474616228909667e-05, "loss": 1.272, "step": 13267 }, { "epoch": 0.36, "learning_rate": 1.4745383733632413e-05, "loss": 1.417, "step": 13268 }, { "epoch": 0.36, "learning_rate": 1.4744605141042505e-05, "loss": 1.3315, "step": 13269 }, { "epoch": 0.36, "learning_rate": 1.4743826511333037e-05, "loss": 1.4717, "step": 13270 }, { "epoch": 0.36, "learning_rate": 1.4743047844510101e-05, "loss": 1.2756, "step": 13271 }, { "epoch": 0.36, "learning_rate": 1.4742269140579788e-05, "loss": 1.374, "step": 13272 }, { "epoch": 0.36, "learning_rate": 1.4741490399548193e-05, "loss": 1.2751, "step": 13273 }, { "epoch": 0.36, "learning_rate": 1.4740711621421406e-05, "loss": 1.3105, "step": 13274 }, { "epoch": 0.36, "learning_rate": 1.473993280620552e-05, "loss": 1.2532, "step": 13275 }, { "epoch": 0.36, "learning_rate": 1.473915395390663e-05, "loss": 1.2937, "step": 13276 }, { "epoch": 0.36, "learning_rate": 1.4738375064530828e-05, "loss": 1.5076, "step": 13277 }, { "epoch": 0.36, "learning_rate": 1.4737596138084207e-05, "loss": 1.4829, "step": 13278 }, { "epoch": 0.36, "learning_rate": 1.4736817174572861e-05, "loss": 1.3533, "step": 13279 }, { "epoch": 0.36, "learning_rate": 1.4736038174002886e-05, "loss": 1.385, "step": 13280 }, { "epoch": 0.36, "learning_rate": 1.4735259136380374e-05, "loss": 1.5029, "step": 13281 }, { "epoch": 0.36, "learning_rate": 1.4734480061711422e-05, "loss": 1.3074, "step": 13282 }, { "epoch": 0.36, "learning_rate": 1.4733700950002124e-05, "loss": 1.3374, "step": 13283 }, { "epoch": 0.36, "learning_rate": 1.4732921801258575e-05, "loss": 1.478, "step": 13284 }, { "epoch": 0.36, "learning_rate": 1.4732142615486873e-05, "loss": 1.3247, "step": 13285 }, { "epoch": 0.36, "learning_rate": 1.4731363392693112e-05, "loss": 1.1172, "step": 13286 }, { "epoch": 0.36, "learning_rate": 1.473058413288339e-05, "loss": 1.3979, "step": 13287 }, { "epoch": 0.36, "learning_rate": 1.47298048360638e-05, "loss": 1.3208, "step": 13288 }, { "epoch": 0.36, "learning_rate": 1.4729025502240442e-05, "loss": 1.2598, "step": 13289 }, { "epoch": 0.36, "learning_rate": 1.472824613141941e-05, "loss": 1.3672, "step": 13290 }, { "epoch": 0.36, "learning_rate": 1.4727466723606807e-05, "loss": 1.416, "step": 13291 }, { "epoch": 0.36, "learning_rate": 1.4726687278808725e-05, "loss": 1.3513, "step": 13292 }, { "epoch": 0.36, "learning_rate": 1.4725907797031268e-05, "loss": 1.3809, "step": 13293 }, { "epoch": 0.36, "learning_rate": 1.4725128278280526e-05, "loss": 1.3164, "step": 13294 }, { "epoch": 0.36, "learning_rate": 1.4724348722562604e-05, "loss": 1.3552, "step": 13295 }, { "epoch": 0.36, "learning_rate": 1.47235691298836e-05, "loss": 1.1807, "step": 13296 }, { "epoch": 0.36, "learning_rate": 1.4722789500249612e-05, "loss": 1.4326, "step": 13297 }, { "epoch": 0.36, "learning_rate": 1.4722009833666737e-05, "loss": 1.4707, "step": 13298 }, { "epoch": 0.36, "learning_rate": 1.472123013014108e-05, "loss": 1.2625, "step": 13299 }, { "epoch": 0.36, "learning_rate": 1.4720450389678738e-05, "loss": 1.3721, "step": 13300 }, { "epoch": 0.36, "learning_rate": 1.4719670612285813e-05, "loss": 1.3867, "step": 13301 }, { "epoch": 0.36, "learning_rate": 1.4718890797968404e-05, "loss": 1.1443, "step": 13302 }, { "epoch": 0.36, "learning_rate": 1.4718110946732613e-05, "loss": 1.5115, "step": 13303 }, { "epoch": 0.36, "learning_rate": 1.4717331058584538e-05, "loss": 1.2415, "step": 13304 }, { "epoch": 0.36, "learning_rate": 1.4716551133530285e-05, "loss": 1.168, "step": 13305 }, { "epoch": 0.36, "learning_rate": 1.4715771171575954e-05, "loss": 1.2256, "step": 13306 }, { "epoch": 0.36, "learning_rate": 1.4714991172727649e-05, "loss": 1.3501, "step": 13307 }, { "epoch": 0.36, "learning_rate": 1.4714211136991466e-05, "loss": 1.2336, "step": 13308 }, { "epoch": 0.36, "learning_rate": 1.4713431064373515e-05, "loss": 1.4072, "step": 13309 }, { "epoch": 0.36, "learning_rate": 1.4712650954879893e-05, "loss": 1.7041, "step": 13310 }, { "epoch": 0.36, "learning_rate": 1.4711870808516708e-05, "loss": 1.3372, "step": 13311 }, { "epoch": 0.36, "learning_rate": 1.4711090625290059e-05, "loss": 1.2827, "step": 13312 }, { "epoch": 0.36, "learning_rate": 1.4710310405206057e-05, "loss": 1.3459, "step": 13313 }, { "epoch": 0.36, "learning_rate": 1.4709530148270794e-05, "loss": 1.2664, "step": 13314 }, { "epoch": 0.36, "learning_rate": 1.4708749854490387e-05, "loss": 1.2126, "step": 13315 }, { "epoch": 0.36, "learning_rate": 1.4707969523870934e-05, "loss": 1.3137, "step": 13316 }, { "epoch": 0.36, "learning_rate": 1.4707189156418542e-05, "loss": 1.3096, "step": 13317 }, { "epoch": 0.36, "learning_rate": 1.4706408752139316e-05, "loss": 1.2231, "step": 13318 }, { "epoch": 0.36, "learning_rate": 1.4705628311039362e-05, "loss": 1.3735, "step": 13319 }, { "epoch": 0.36, "learning_rate": 1.470484783312478e-05, "loss": 1.3965, "step": 13320 }, { "epoch": 0.36, "learning_rate": 1.4704067318401684e-05, "loss": 1.2275, "step": 13321 }, { "epoch": 0.36, "learning_rate": 1.4703286766876178e-05, "loss": 1.2795, "step": 13322 }, { "epoch": 0.36, "learning_rate": 1.4702506178554367e-05, "loss": 1.3542, "step": 13323 }, { "epoch": 0.36, "learning_rate": 1.4701725553442358e-05, "loss": 1.6055, "step": 13324 }, { "epoch": 0.36, "learning_rate": 1.4700944891546262e-05, "loss": 1.2292, "step": 13325 }, { "epoch": 0.36, "learning_rate": 1.4700164192872182e-05, "loss": 1.3494, "step": 13326 }, { "epoch": 0.36, "learning_rate": 1.4699383457426229e-05, "loss": 1.3, "step": 13327 }, { "epoch": 0.36, "learning_rate": 1.4698602685214507e-05, "loss": 1.498, "step": 13328 }, { "epoch": 0.36, "learning_rate": 1.4697821876243128e-05, "loss": 1.3618, "step": 13329 }, { "epoch": 0.36, "learning_rate": 1.46970410305182e-05, "loss": 1.3748, "step": 13330 }, { "epoch": 0.36, "learning_rate": 1.469626014804583e-05, "loss": 1.2356, "step": 13331 }, { "epoch": 0.36, "learning_rate": 1.4695479228832132e-05, "loss": 1.2654, "step": 13332 }, { "epoch": 0.36, "learning_rate": 1.4694698272883212e-05, "loss": 1.2317, "step": 13333 }, { "epoch": 0.36, "learning_rate": 1.4693917280205179e-05, "loss": 1.3394, "step": 13334 }, { "epoch": 0.36, "learning_rate": 1.4693136250804145e-05, "loss": 1.4675, "step": 13335 }, { "epoch": 0.36, "learning_rate": 1.469235518468622e-05, "loss": 1.3035, "step": 13336 }, { "epoch": 0.36, "learning_rate": 1.4691574081857514e-05, "loss": 1.3789, "step": 13337 }, { "epoch": 0.36, "learning_rate": 1.4690792942324138e-05, "loss": 1.225, "step": 13338 }, { "epoch": 0.36, "learning_rate": 1.4690011766092205e-05, "loss": 1.4116, "step": 13339 }, { "epoch": 0.36, "learning_rate": 1.4689230553167826e-05, "loss": 1.2278, "step": 13340 }, { "epoch": 0.36, "learning_rate": 1.468844930355711e-05, "loss": 1.3069, "step": 13341 }, { "epoch": 0.36, "learning_rate": 1.4687668017266173e-05, "loss": 1.2668, "step": 13342 }, { "epoch": 0.36, "learning_rate": 1.4686886694301126e-05, "loss": 1.342, "step": 13343 }, { "epoch": 0.36, "learning_rate": 1.4686105334668081e-05, "loss": 1.2515, "step": 13344 }, { "epoch": 0.36, "learning_rate": 1.4685323938373146e-05, "loss": 1.4258, "step": 13345 }, { "epoch": 0.36, "learning_rate": 1.4684542505422448e-05, "loss": 1.4004, "step": 13346 }, { "epoch": 0.36, "learning_rate": 1.4683761035822089e-05, "loss": 1.3635, "step": 13347 }, { "epoch": 0.36, "learning_rate": 1.4682979529578186e-05, "loss": 1.4553, "step": 13348 }, { "epoch": 0.36, "learning_rate": 1.468219798669685e-05, "loss": 1.3262, "step": 13349 }, { "epoch": 0.36, "learning_rate": 1.4681416407184203e-05, "loss": 1.1584, "step": 13350 }, { "epoch": 0.36, "learning_rate": 1.4680634791046356e-05, "loss": 1.7065, "step": 13351 }, { "epoch": 0.36, "learning_rate": 1.4679853138289421e-05, "loss": 1.2659, "step": 13352 }, { "epoch": 0.36, "learning_rate": 1.4679071448919517e-05, "loss": 1.2344, "step": 13353 }, { "epoch": 0.36, "learning_rate": 1.4678289722942757e-05, "loss": 1.4617, "step": 13354 }, { "epoch": 0.36, "learning_rate": 1.4677507960365258e-05, "loss": 1.3691, "step": 13355 }, { "epoch": 0.36, "learning_rate": 1.4676726161193137e-05, "loss": 1.4446, "step": 13356 }, { "epoch": 0.36, "learning_rate": 1.4675944325432511e-05, "loss": 1.2964, "step": 13357 }, { "epoch": 0.36, "learning_rate": 1.4675162453089495e-05, "loss": 1.2839, "step": 13358 }, { "epoch": 0.36, "learning_rate": 1.4674380544170203e-05, "loss": 1.2935, "step": 13359 }, { "epoch": 0.36, "learning_rate": 1.4673598598680758e-05, "loss": 1.2681, "step": 13360 }, { "epoch": 0.36, "learning_rate": 1.4672816616627275e-05, "loss": 1.386, "step": 13361 }, { "epoch": 0.36, "learning_rate": 1.4672034598015872e-05, "loss": 1.3931, "step": 13362 }, { "epoch": 0.36, "learning_rate": 1.4671252542852667e-05, "loss": 1.3901, "step": 13363 }, { "epoch": 0.36, "learning_rate": 1.467047045114378e-05, "loss": 1.3123, "step": 13364 }, { "epoch": 0.36, "learning_rate": 1.4669688322895327e-05, "loss": 1.1268, "step": 13365 }, { "epoch": 0.37, "learning_rate": 1.4668906158113432e-05, "loss": 1.3018, "step": 13366 }, { "epoch": 0.37, "learning_rate": 1.4668123956804205e-05, "loss": 1.3953, "step": 13367 }, { "epoch": 0.37, "learning_rate": 1.4667341718973776e-05, "loss": 1.3284, "step": 13368 }, { "epoch": 0.37, "learning_rate": 1.4666559444628257e-05, "loss": 1.4629, "step": 13369 }, { "epoch": 0.37, "learning_rate": 1.4665777133773773e-05, "loss": 1.384, "step": 13370 }, { "epoch": 0.37, "learning_rate": 1.4664994786416442e-05, "loss": 1.3467, "step": 13371 }, { "epoch": 0.37, "learning_rate": 1.4664212402562388e-05, "loss": 1.3604, "step": 13372 }, { "epoch": 0.37, "learning_rate": 1.4663429982217725e-05, "loss": 1.3245, "step": 13373 }, { "epoch": 0.37, "learning_rate": 1.4662647525388582e-05, "loss": 1.2927, "step": 13374 }, { "epoch": 0.37, "learning_rate": 1.4661865032081075e-05, "loss": 1.177, "step": 13375 }, { "epoch": 0.37, "learning_rate": 1.4661082502301329e-05, "loss": 1.7212, "step": 13376 }, { "epoch": 0.37, "learning_rate": 1.4660299936055466e-05, "loss": 1.1082, "step": 13377 }, { "epoch": 0.37, "learning_rate": 1.4659517333349607e-05, "loss": 1.3159, "step": 13378 }, { "epoch": 0.37, "learning_rate": 1.4658734694189876e-05, "loss": 1.3032, "step": 13379 }, { "epoch": 0.37, "learning_rate": 1.4657952018582395e-05, "loss": 1.4697, "step": 13380 }, { "epoch": 0.37, "learning_rate": 1.4657169306533288e-05, "loss": 1.3623, "step": 13381 }, { "epoch": 0.37, "learning_rate": 1.4656386558048678e-05, "loss": 1.2917, "step": 13382 }, { "epoch": 0.37, "learning_rate": 1.465560377313469e-05, "loss": 1.3665, "step": 13383 }, { "epoch": 0.37, "learning_rate": 1.4654820951797445e-05, "loss": 1.2434, "step": 13384 }, { "epoch": 0.37, "learning_rate": 1.4654038094043073e-05, "loss": 1.3665, "step": 13385 }, { "epoch": 0.37, "learning_rate": 1.4653255199877694e-05, "loss": 1.5029, "step": 13386 }, { "epoch": 0.37, "learning_rate": 1.4652472269307433e-05, "loss": 1.4111, "step": 13387 }, { "epoch": 0.37, "learning_rate": 1.465168930233842e-05, "loss": 1.3223, "step": 13388 }, { "epoch": 0.37, "learning_rate": 1.4650906298976774e-05, "loss": 1.4346, "step": 13389 }, { "epoch": 0.37, "learning_rate": 1.4650123259228626e-05, "loss": 1.3301, "step": 13390 }, { "epoch": 0.37, "learning_rate": 1.4649340183100098e-05, "loss": 1.4224, "step": 13391 }, { "epoch": 0.37, "learning_rate": 1.464855707059732e-05, "loss": 1.3406, "step": 13392 }, { "epoch": 0.37, "learning_rate": 1.4647773921726418e-05, "loss": 1.3057, "step": 13393 }, { "epoch": 0.37, "learning_rate": 1.4646990736493516e-05, "loss": 1.4133, "step": 13394 }, { "epoch": 0.37, "learning_rate": 1.4646207514904748e-05, "loss": 1.375, "step": 13395 }, { "epoch": 0.37, "learning_rate": 1.4645424256966235e-05, "loss": 1.3164, "step": 13396 }, { "epoch": 0.37, "learning_rate": 1.4644640962684107e-05, "loss": 1.2349, "step": 13397 }, { "epoch": 0.37, "learning_rate": 1.464385763206449e-05, "loss": 1.2449, "step": 13398 }, { "epoch": 0.37, "learning_rate": 1.4643074265113519e-05, "loss": 1.3713, "step": 13399 }, { "epoch": 0.37, "learning_rate": 1.4642290861837314e-05, "loss": 1.2646, "step": 13400 }, { "epoch": 0.37, "learning_rate": 1.4641507422242012e-05, "loss": 1.3115, "step": 13401 }, { "epoch": 0.37, "learning_rate": 1.4640723946333735e-05, "loss": 1.344, "step": 13402 }, { "epoch": 0.37, "learning_rate": 1.463994043411862e-05, "loss": 1.3364, "step": 13403 }, { "epoch": 0.37, "learning_rate": 1.463915688560279e-05, "loss": 1.2222, "step": 13404 }, { "epoch": 0.37, "learning_rate": 1.4638373300792379e-05, "loss": 1.2825, "step": 13405 }, { "epoch": 0.37, "learning_rate": 1.4637589679693516e-05, "loss": 1.3687, "step": 13406 }, { "epoch": 0.37, "learning_rate": 1.4636806022312332e-05, "loss": 1.3926, "step": 13407 }, { "epoch": 0.37, "learning_rate": 1.4636022328654957e-05, "loss": 1.3696, "step": 13408 }, { "epoch": 0.37, "learning_rate": 1.4635238598727526e-05, "loss": 1.4351, "step": 13409 }, { "epoch": 0.37, "learning_rate": 1.4634454832536164e-05, "loss": 1.3003, "step": 13410 }, { "epoch": 0.37, "learning_rate": 1.4633671030087011e-05, "loss": 1.4014, "step": 13411 }, { "epoch": 0.37, "learning_rate": 1.4632887191386191e-05, "loss": 1.3213, "step": 13412 }, { "epoch": 0.37, "learning_rate": 1.4632103316439845e-05, "loss": 1.3621, "step": 13413 }, { "epoch": 0.37, "learning_rate": 1.4631319405254096e-05, "loss": 1.2734, "step": 13414 }, { "epoch": 0.37, "learning_rate": 1.4630535457835085e-05, "loss": 1.4727, "step": 13415 }, { "epoch": 0.37, "learning_rate": 1.4629751474188938e-05, "loss": 1.3396, "step": 13416 }, { "epoch": 0.37, "learning_rate": 1.4628967454321798e-05, "loss": 1.1775, "step": 13417 }, { "epoch": 0.37, "learning_rate": 1.4628183398239788e-05, "loss": 1.2205, "step": 13418 }, { "epoch": 0.37, "learning_rate": 1.4627399305949053e-05, "loss": 1.1978, "step": 13419 }, { "epoch": 0.37, "learning_rate": 1.4626615177455716e-05, "loss": 1.2883, "step": 13420 }, { "epoch": 0.37, "learning_rate": 1.4625831012765921e-05, "loss": 1.2395, "step": 13421 }, { "epoch": 0.37, "learning_rate": 1.4625046811885798e-05, "loss": 1.2595, "step": 13422 }, { "epoch": 0.37, "learning_rate": 1.4624262574821484e-05, "loss": 1.3462, "step": 13423 }, { "epoch": 0.37, "learning_rate": 1.4623478301579115e-05, "loss": 1.2827, "step": 13424 }, { "epoch": 0.37, "learning_rate": 1.4622693992164825e-05, "loss": 1.1753, "step": 13425 }, { "epoch": 0.37, "learning_rate": 1.4621909646584751e-05, "loss": 1.2051, "step": 13426 }, { "epoch": 0.37, "learning_rate": 1.4621125264845029e-05, "loss": 1.26, "step": 13427 }, { "epoch": 0.37, "learning_rate": 1.4620340846951795e-05, "loss": 1.4033, "step": 13428 }, { "epoch": 0.37, "learning_rate": 1.4619556392911189e-05, "loss": 1.2544, "step": 13429 }, { "epoch": 0.37, "learning_rate": 1.4618771902729343e-05, "loss": 1.259, "step": 13430 }, { "epoch": 0.37, "learning_rate": 1.4617987376412401e-05, "loss": 1.3628, "step": 13431 }, { "epoch": 0.37, "learning_rate": 1.4617202813966495e-05, "loss": 1.1665, "step": 13432 }, { "epoch": 0.37, "learning_rate": 1.461641821539777e-05, "loss": 1.292, "step": 13433 }, { "epoch": 0.37, "learning_rate": 1.4615633580712354e-05, "loss": 1.3708, "step": 13434 }, { "epoch": 0.37, "learning_rate": 1.4614848909916393e-05, "loss": 1.167, "step": 13435 }, { "epoch": 0.37, "learning_rate": 1.4614064203016024e-05, "loss": 1.4102, "step": 13436 }, { "epoch": 0.37, "learning_rate": 1.4613279460017389e-05, "loss": 1.4297, "step": 13437 }, { "epoch": 0.37, "learning_rate": 1.4612494680926621e-05, "loss": 1.4075, "step": 13438 }, { "epoch": 0.37, "learning_rate": 1.4611709865749864e-05, "loss": 1.2881, "step": 13439 }, { "epoch": 0.37, "learning_rate": 1.461092501449326e-05, "loss": 1.4185, "step": 13440 }, { "epoch": 0.37, "learning_rate": 1.4610140127162944e-05, "loss": 1.3169, "step": 13441 }, { "epoch": 0.37, "learning_rate": 1.4609355203765063e-05, "loss": 1.3469, "step": 13442 }, { "epoch": 0.37, "learning_rate": 1.4608570244305753e-05, "loss": 1.3584, "step": 13443 }, { "epoch": 0.37, "learning_rate": 1.4607785248791156e-05, "loss": 1.4121, "step": 13444 }, { "epoch": 0.37, "learning_rate": 1.4607000217227414e-05, "loss": 1.1858, "step": 13445 }, { "epoch": 0.37, "learning_rate": 1.4606215149620669e-05, "loss": 1.7979, "step": 13446 }, { "epoch": 0.37, "learning_rate": 1.4605430045977063e-05, "loss": 1.2834, "step": 13447 }, { "epoch": 0.37, "learning_rate": 1.4604644906302735e-05, "loss": 1.3408, "step": 13448 }, { "epoch": 0.37, "learning_rate": 1.4603859730603834e-05, "loss": 1.3411, "step": 13449 }, { "epoch": 0.37, "learning_rate": 1.46030745188865e-05, "loss": 1.3, "step": 13450 }, { "epoch": 0.37, "learning_rate": 1.460228927115687e-05, "loss": 1.3711, "step": 13451 }, { "epoch": 0.37, "learning_rate": 1.46015039874211e-05, "loss": 1.4219, "step": 13452 }, { "epoch": 0.37, "learning_rate": 1.4600718667685318e-05, "loss": 1.2839, "step": 13453 }, { "epoch": 0.37, "learning_rate": 1.4599933311955683e-05, "loss": 1.1692, "step": 13454 }, { "epoch": 0.37, "learning_rate": 1.4599147920238333e-05, "loss": 1.3428, "step": 13455 }, { "epoch": 0.37, "learning_rate": 1.4598362492539411e-05, "loss": 1.4344, "step": 13456 }, { "epoch": 0.37, "learning_rate": 1.4597577028865063e-05, "loss": 1.3643, "step": 13457 }, { "epoch": 0.37, "learning_rate": 1.4596791529221435e-05, "loss": 1.387, "step": 13458 }, { "epoch": 0.37, "learning_rate": 1.4596005993614668e-05, "loss": 1.3066, "step": 13459 }, { "epoch": 0.37, "learning_rate": 1.4595220422050915e-05, "loss": 1.769, "step": 13460 }, { "epoch": 0.37, "learning_rate": 1.4594434814536318e-05, "loss": 1.1257, "step": 13461 }, { "epoch": 0.37, "learning_rate": 1.4593649171077022e-05, "loss": 1.3618, "step": 13462 }, { "epoch": 0.37, "learning_rate": 1.4592863491679176e-05, "loss": 1.3003, "step": 13463 }, { "epoch": 0.37, "learning_rate": 1.4592077776348928e-05, "loss": 1.1785, "step": 13464 }, { "epoch": 0.37, "learning_rate": 1.4591292025092418e-05, "loss": 1.3303, "step": 13465 }, { "epoch": 0.37, "learning_rate": 1.4590506237915802e-05, "loss": 1.2063, "step": 13466 }, { "epoch": 0.37, "learning_rate": 1.4589720414825221e-05, "loss": 1.1943, "step": 13467 }, { "epoch": 0.37, "learning_rate": 1.4588934555826828e-05, "loss": 1.4102, "step": 13468 }, { "epoch": 0.37, "learning_rate": 1.4588148660926766e-05, "loss": 1.3999, "step": 13469 }, { "epoch": 0.37, "learning_rate": 1.4587362730131189e-05, "loss": 1.7026, "step": 13470 }, { "epoch": 0.37, "learning_rate": 1.4586576763446241e-05, "loss": 1.2781, "step": 13471 }, { "epoch": 0.37, "learning_rate": 1.4585790760878076e-05, "loss": 1.7358, "step": 13472 }, { "epoch": 0.37, "learning_rate": 1.4585004722432838e-05, "loss": 1.2175, "step": 13473 }, { "epoch": 0.37, "learning_rate": 1.4584218648116681e-05, "loss": 1.3618, "step": 13474 }, { "epoch": 0.37, "learning_rate": 1.4583432537935753e-05, "loss": 1.4299, "step": 13475 }, { "epoch": 0.37, "learning_rate": 1.4582646391896203e-05, "loss": 1.2881, "step": 13476 }, { "epoch": 0.37, "learning_rate": 1.4581860210004181e-05, "loss": 1.3916, "step": 13477 }, { "epoch": 0.37, "learning_rate": 1.4581073992265844e-05, "loss": 1.3665, "step": 13478 }, { "epoch": 0.37, "learning_rate": 1.4580287738687333e-05, "loss": 1.249, "step": 13479 }, { "epoch": 0.37, "learning_rate": 1.457950144927481e-05, "loss": 1.4319, "step": 13480 }, { "epoch": 0.37, "learning_rate": 1.4578715124034415e-05, "loss": 1.5122, "step": 13481 }, { "epoch": 0.37, "learning_rate": 1.4577928762972311e-05, "loss": 1.3298, "step": 13482 }, { "epoch": 0.37, "learning_rate": 1.4577142366094643e-05, "loss": 1.2581, "step": 13483 }, { "epoch": 0.37, "learning_rate": 1.4576355933407565e-05, "loss": 1.4146, "step": 13484 }, { "epoch": 0.37, "learning_rate": 1.457556946491723e-05, "loss": 1.4016, "step": 13485 }, { "epoch": 0.37, "learning_rate": 1.4574782960629792e-05, "loss": 1.313, "step": 13486 }, { "epoch": 0.37, "learning_rate": 1.4573996420551405e-05, "loss": 1.3857, "step": 13487 }, { "epoch": 0.37, "learning_rate": 1.4573209844688217e-05, "loss": 1.3423, "step": 13488 }, { "epoch": 0.37, "learning_rate": 1.4572423233046386e-05, "loss": 1.219, "step": 13489 }, { "epoch": 0.37, "learning_rate": 1.4571636585632067e-05, "loss": 1.188, "step": 13490 }, { "epoch": 0.37, "learning_rate": 1.4570849902451416e-05, "loss": 1.2402, "step": 13491 }, { "epoch": 0.37, "learning_rate": 1.457006318351058e-05, "loss": 1.4233, "step": 13492 }, { "epoch": 0.37, "learning_rate": 1.4569276428815722e-05, "loss": 1.8496, "step": 13493 }, { "epoch": 0.37, "learning_rate": 1.4568489638372992e-05, "loss": 1.2056, "step": 13494 }, { "epoch": 0.37, "learning_rate": 1.456770281218855e-05, "loss": 1.3972, "step": 13495 }, { "epoch": 0.37, "learning_rate": 1.4566915950268542e-05, "loss": 1.3882, "step": 13496 }, { "epoch": 0.37, "learning_rate": 1.456612905261914e-05, "loss": 1.4504, "step": 13497 }, { "epoch": 0.37, "learning_rate": 1.4565342119246487e-05, "loss": 1.4551, "step": 13498 }, { "epoch": 0.37, "learning_rate": 1.4564555150156746e-05, "loss": 1.4817, "step": 13499 }, { "epoch": 0.37, "learning_rate": 1.4563768145356065e-05, "loss": 1.3032, "step": 13500 }, { "epoch": 0.37, "learning_rate": 1.4562981104850616e-05, "loss": 1.3657, "step": 13501 }, { "epoch": 0.37, "learning_rate": 1.4562194028646545e-05, "loss": 1.4121, "step": 13502 }, { "epoch": 0.37, "learning_rate": 1.4561406916750014e-05, "loss": 1.4175, "step": 13503 }, { "epoch": 0.37, "learning_rate": 1.456061976916718e-05, "loss": 1.3032, "step": 13504 }, { "epoch": 0.37, "learning_rate": 1.4559832585904204e-05, "loss": 1.2795, "step": 13505 }, { "epoch": 0.37, "learning_rate": 1.455904536696724e-05, "loss": 1.2312, "step": 13506 }, { "epoch": 0.37, "learning_rate": 1.4558258112362448e-05, "loss": 1.261, "step": 13507 }, { "epoch": 0.37, "learning_rate": 1.4557470822095988e-05, "loss": 1.1758, "step": 13508 }, { "epoch": 0.37, "learning_rate": 1.455668349617402e-05, "loss": 1.7349, "step": 13509 }, { "epoch": 0.37, "learning_rate": 1.4555896134602703e-05, "loss": 1.3882, "step": 13510 }, { "epoch": 0.37, "learning_rate": 1.4555108737388199e-05, "loss": 1.2682, "step": 13511 }, { "epoch": 0.37, "learning_rate": 1.4554321304536662e-05, "loss": 1.2888, "step": 13512 }, { "epoch": 0.37, "learning_rate": 1.4553533836054261e-05, "loss": 1.3408, "step": 13513 }, { "epoch": 0.37, "learning_rate": 1.455274633194715e-05, "loss": 1.2317, "step": 13514 }, { "epoch": 0.37, "learning_rate": 1.4551958792221492e-05, "loss": 1.4482, "step": 13515 }, { "epoch": 0.37, "learning_rate": 1.4551171216883448e-05, "loss": 1.2004, "step": 13516 }, { "epoch": 0.37, "learning_rate": 1.4550383605939185e-05, "loss": 1.5146, "step": 13517 }, { "epoch": 0.37, "learning_rate": 1.4549595959394856e-05, "loss": 1.7246, "step": 13518 }, { "epoch": 0.37, "learning_rate": 1.454880827725663e-05, "loss": 1.3608, "step": 13519 }, { "epoch": 0.37, "learning_rate": 1.4548020559530666e-05, "loss": 1.3657, "step": 13520 }, { "epoch": 0.37, "learning_rate": 1.454723280622313e-05, "loss": 1.2361, "step": 13521 }, { "epoch": 0.37, "learning_rate": 1.454644501734018e-05, "loss": 1.3779, "step": 13522 }, { "epoch": 0.37, "learning_rate": 1.4545657192887984e-05, "loss": 1.4626, "step": 13523 }, { "epoch": 0.37, "learning_rate": 1.4544869332872702e-05, "loss": 1.3286, "step": 13524 }, { "epoch": 0.37, "learning_rate": 1.4544081437300502e-05, "loss": 1.416, "step": 13525 }, { "epoch": 0.37, "learning_rate": 1.454329350617754e-05, "loss": 1.2686, "step": 13526 }, { "epoch": 0.37, "learning_rate": 1.4542505539509993e-05, "loss": 1.2654, "step": 13527 }, { "epoch": 0.37, "learning_rate": 1.4541717537304015e-05, "loss": 1.3225, "step": 13528 }, { "epoch": 0.37, "learning_rate": 1.4540929499565776e-05, "loss": 1.4128, "step": 13529 }, { "epoch": 0.37, "learning_rate": 1.4540141426301437e-05, "loss": 1.3877, "step": 13530 }, { "epoch": 0.37, "learning_rate": 1.4539353317517168e-05, "loss": 1.3047, "step": 13531 }, { "epoch": 0.37, "learning_rate": 1.4538565173219135e-05, "loss": 1.4263, "step": 13532 }, { "epoch": 0.37, "learning_rate": 1.45377769934135e-05, "loss": 1.2605, "step": 13533 }, { "epoch": 0.37, "learning_rate": 1.4536988778106433e-05, "loss": 1.4419, "step": 13534 }, { "epoch": 0.37, "learning_rate": 1.4536200527304098e-05, "loss": 1.2334, "step": 13535 }, { "epoch": 0.37, "learning_rate": 1.4535412241012665e-05, "loss": 1.4475, "step": 13536 }, { "epoch": 0.37, "learning_rate": 1.4534623919238297e-05, "loss": 1.2559, "step": 13537 }, { "epoch": 0.37, "learning_rate": 1.4533835561987165e-05, "loss": 1.2644, "step": 13538 }, { "epoch": 0.37, "learning_rate": 1.4533047169265438e-05, "loss": 1.5027, "step": 13539 }, { "epoch": 0.37, "learning_rate": 1.453225874107928e-05, "loss": 1.3972, "step": 13540 }, { "epoch": 0.37, "learning_rate": 1.4531470277434858e-05, "loss": 1.3086, "step": 13541 }, { "epoch": 0.37, "learning_rate": 1.4530681778338348e-05, "loss": 1.3311, "step": 13542 }, { "epoch": 0.37, "learning_rate": 1.452989324379591e-05, "loss": 1.3918, "step": 13543 }, { "epoch": 0.37, "learning_rate": 1.4529104673813717e-05, "loss": 1.4531, "step": 13544 }, { "epoch": 0.37, "learning_rate": 1.4528316068397943e-05, "loss": 1.2949, "step": 13545 }, { "epoch": 0.37, "learning_rate": 1.4527527427554749e-05, "loss": 1.7871, "step": 13546 }, { "epoch": 0.37, "learning_rate": 1.452673875129031e-05, "loss": 1.7173, "step": 13547 }, { "epoch": 0.37, "learning_rate": 1.45259500396108e-05, "loss": 1.073, "step": 13548 }, { "epoch": 0.37, "learning_rate": 1.452516129252238e-05, "loss": 1.1191, "step": 13549 }, { "epoch": 0.37, "learning_rate": 1.452437251003123e-05, "loss": 1.2954, "step": 13550 }, { "epoch": 0.37, "learning_rate": 1.4523583692143514e-05, "loss": 1.3154, "step": 13551 }, { "epoch": 0.37, "learning_rate": 1.4522794838865411e-05, "loss": 1.2219, "step": 13552 }, { "epoch": 0.37, "learning_rate": 1.4522005950203083e-05, "loss": 1.3789, "step": 13553 }, { "epoch": 0.37, "learning_rate": 1.4521217026162709e-05, "loss": 1.2432, "step": 13554 }, { "epoch": 0.37, "learning_rate": 1.4520428066750456e-05, "loss": 1.3433, "step": 13555 }, { "epoch": 0.37, "learning_rate": 1.4519639071972504e-05, "loss": 1.3682, "step": 13556 }, { "epoch": 0.37, "learning_rate": 1.4518850041835017e-05, "loss": 1.1924, "step": 13557 }, { "epoch": 0.37, "learning_rate": 1.4518060976344176e-05, "loss": 1.3013, "step": 13558 }, { "epoch": 0.37, "learning_rate": 1.451727187550615e-05, "loss": 1.2676, "step": 13559 }, { "epoch": 0.37, "learning_rate": 1.451648273932711e-05, "loss": 1.5405, "step": 13560 }, { "epoch": 0.37, "learning_rate": 1.4515693567813234e-05, "loss": 1.3911, "step": 13561 }, { "epoch": 0.37, "learning_rate": 1.4514904360970697e-05, "loss": 1.2571, "step": 13562 }, { "epoch": 0.37, "learning_rate": 1.4514115118805668e-05, "loss": 1.4639, "step": 13563 }, { "epoch": 0.37, "learning_rate": 1.4513325841324327e-05, "loss": 1.7256, "step": 13564 }, { "epoch": 0.37, "learning_rate": 1.4512536528532845e-05, "loss": 1.2671, "step": 13565 }, { "epoch": 0.37, "learning_rate": 1.4511747180437404e-05, "loss": 1.4116, "step": 13566 }, { "epoch": 0.37, "learning_rate": 1.4510957797044169e-05, "loss": 1.3452, "step": 13567 }, { "epoch": 0.37, "learning_rate": 1.4510168378359326e-05, "loss": 1.4158, "step": 13568 }, { "epoch": 0.37, "learning_rate": 1.4509378924389044e-05, "loss": 1.3103, "step": 13569 }, { "epoch": 0.37, "learning_rate": 1.4508589435139504e-05, "loss": 1.4497, "step": 13570 }, { "epoch": 0.37, "learning_rate": 1.4507799910616877e-05, "loss": 1.4221, "step": 13571 }, { "epoch": 0.37, "learning_rate": 1.4507010350827346e-05, "loss": 1.3679, "step": 13572 }, { "epoch": 0.37, "learning_rate": 1.4506220755777083e-05, "loss": 1.4419, "step": 13573 }, { "epoch": 0.37, "learning_rate": 1.450543112547227e-05, "loss": 1.3916, "step": 13574 }, { "epoch": 0.37, "learning_rate": 1.450464145991908e-05, "loss": 1.4849, "step": 13575 }, { "epoch": 0.37, "learning_rate": 1.4503851759123695e-05, "loss": 1.3113, "step": 13576 }, { "epoch": 0.37, "learning_rate": 1.450306202309229e-05, "loss": 1.3586, "step": 13577 }, { "epoch": 0.37, "learning_rate": 1.4502272251831047e-05, "loss": 1.1931, "step": 13578 }, { "epoch": 0.37, "learning_rate": 1.4501482445346141e-05, "loss": 1.3916, "step": 13579 }, { "epoch": 0.37, "learning_rate": 1.4500692603643756e-05, "loss": 1.6924, "step": 13580 }, { "epoch": 0.37, "learning_rate": 1.4499902726730066e-05, "loss": 1.3242, "step": 13581 }, { "epoch": 0.37, "learning_rate": 1.4499112814611256e-05, "loss": 1.6313, "step": 13582 }, { "epoch": 0.37, "learning_rate": 1.44983228672935e-05, "loss": 1.3245, "step": 13583 }, { "epoch": 0.37, "learning_rate": 1.4497532884782985e-05, "loss": 1.1716, "step": 13584 }, { "epoch": 0.37, "learning_rate": 1.4496742867085884e-05, "loss": 1.3953, "step": 13585 }, { "epoch": 0.37, "learning_rate": 1.4495952814208383e-05, "loss": 1.2441, "step": 13586 }, { "epoch": 0.37, "learning_rate": 1.4495162726156659e-05, "loss": 1.2556, "step": 13587 }, { "epoch": 0.37, "learning_rate": 1.44943726029369e-05, "loss": 1.5056, "step": 13588 }, { "epoch": 0.37, "learning_rate": 1.4493582444555278e-05, "loss": 1.166, "step": 13589 }, { "epoch": 0.37, "learning_rate": 1.4492792251017985e-05, "loss": 1.385, "step": 13590 }, { "epoch": 0.37, "learning_rate": 1.4492002022331194e-05, "loss": 1.1765, "step": 13591 }, { "epoch": 0.37, "learning_rate": 1.4491211758501094e-05, "loss": 1.3916, "step": 13592 }, { "epoch": 0.37, "learning_rate": 1.4490421459533863e-05, "loss": 1.2488, "step": 13593 }, { "epoch": 0.37, "learning_rate": 1.4489631125435685e-05, "loss": 1.155, "step": 13594 }, { "epoch": 0.37, "learning_rate": 1.4488840756212747e-05, "loss": 1.2942, "step": 13595 }, { "epoch": 0.37, "learning_rate": 1.448805035187123e-05, "loss": 1.1836, "step": 13596 }, { "epoch": 0.37, "learning_rate": 1.4487259912417317e-05, "loss": 1.4338, "step": 13597 }, { "epoch": 0.37, "learning_rate": 1.4486469437857192e-05, "loss": 1.3711, "step": 13598 }, { "epoch": 0.37, "learning_rate": 1.4485678928197043e-05, "loss": 1.2532, "step": 13599 }, { "epoch": 0.37, "learning_rate": 1.4484888383443045e-05, "loss": 1.3743, "step": 13600 }, { "epoch": 0.37, "learning_rate": 1.4484097803601393e-05, "loss": 1.1924, "step": 13601 }, { "epoch": 0.37, "learning_rate": 1.4483307188678268e-05, "loss": 1.314, "step": 13602 }, { "epoch": 0.37, "learning_rate": 1.4482516538679857e-05, "loss": 1.2495, "step": 13603 }, { "epoch": 0.37, "learning_rate": 1.4481725853612342e-05, "loss": 1.3779, "step": 13604 }, { "epoch": 0.37, "learning_rate": 1.4480935133481913e-05, "loss": 1.1741, "step": 13605 }, { "epoch": 0.37, "learning_rate": 1.4480144378294754e-05, "loss": 1.3315, "step": 13606 }, { "epoch": 0.37, "learning_rate": 1.4479353588057052e-05, "loss": 1.3118, "step": 13607 }, { "epoch": 0.37, "learning_rate": 1.4478562762774992e-05, "loss": 1.2563, "step": 13608 }, { "epoch": 0.37, "learning_rate": 1.4477771902454767e-05, "loss": 1.2632, "step": 13609 }, { "epoch": 0.37, "learning_rate": 1.4476981007102554e-05, "loss": 1.3081, "step": 13610 }, { "epoch": 0.37, "learning_rate": 1.4476190076724554e-05, "loss": 1.2935, "step": 13611 }, { "epoch": 0.37, "learning_rate": 1.4475399111326944e-05, "loss": 1.3276, "step": 13612 }, { "epoch": 0.37, "learning_rate": 1.4474608110915917e-05, "loss": 1.5149, "step": 13613 }, { "epoch": 0.37, "learning_rate": 1.4473817075497661e-05, "loss": 1.3345, "step": 13614 }, { "epoch": 0.37, "learning_rate": 1.447302600507836e-05, "loss": 1.231, "step": 13615 }, { "epoch": 0.37, "learning_rate": 1.447223489966421e-05, "loss": 1.4175, "step": 13616 }, { "epoch": 0.37, "learning_rate": 1.4471443759261399e-05, "loss": 1.2439, "step": 13617 }, { "epoch": 0.37, "learning_rate": 1.447065258387611e-05, "loss": 1.249, "step": 13618 }, { "epoch": 0.37, "learning_rate": 1.4469861373514542e-05, "loss": 1.2952, "step": 13619 }, { "epoch": 0.37, "learning_rate": 1.4469070128182878e-05, "loss": 1.3765, "step": 13620 }, { "epoch": 0.37, "learning_rate": 1.4468278847887312e-05, "loss": 1.3567, "step": 13621 }, { "epoch": 0.37, "learning_rate": 1.446748753263403e-05, "loss": 1.2285, "step": 13622 }, { "epoch": 0.37, "learning_rate": 1.4466696182429232e-05, "loss": 1.2485, "step": 13623 }, { "epoch": 0.37, "learning_rate": 1.4465904797279095e-05, "loss": 1.3867, "step": 13624 }, { "epoch": 0.37, "learning_rate": 1.4465113377189828e-05, "loss": 1.3906, "step": 13625 }, { "epoch": 0.37, "learning_rate": 1.4464321922167608e-05, "loss": 1.3105, "step": 13626 }, { "epoch": 0.37, "learning_rate": 1.4463530432218636e-05, "loss": 1.3276, "step": 13627 }, { "epoch": 0.37, "learning_rate": 1.4462738907349096e-05, "loss": 1.2583, "step": 13628 }, { "epoch": 0.37, "learning_rate": 1.446194734756519e-05, "loss": 1.1787, "step": 13629 }, { "epoch": 0.37, "learning_rate": 1.4461155752873104e-05, "loss": 1.304, "step": 13630 }, { "epoch": 0.37, "learning_rate": 1.4460364123279033e-05, "loss": 1.4331, "step": 13631 }, { "epoch": 0.37, "learning_rate": 1.4459572458789173e-05, "loss": 1.4465, "step": 13632 }, { "epoch": 0.37, "learning_rate": 1.4458780759409715e-05, "loss": 1.3794, "step": 13633 }, { "epoch": 0.37, "learning_rate": 1.4457989025146847e-05, "loss": 1.3374, "step": 13634 }, { "epoch": 0.37, "learning_rate": 1.4457197256006777e-05, "loss": 1.3374, "step": 13635 }, { "epoch": 0.37, "learning_rate": 1.4456405451995688e-05, "loss": 1.3662, "step": 13636 }, { "epoch": 0.37, "learning_rate": 1.445561361311978e-05, "loss": 1.377, "step": 13637 }, { "epoch": 0.37, "learning_rate": 1.4454821739385243e-05, "loss": 1.4341, "step": 13638 }, { "epoch": 0.37, "learning_rate": 1.4454029830798275e-05, "loss": 1.3066, "step": 13639 }, { "epoch": 0.37, "learning_rate": 1.4453237887365075e-05, "loss": 1.2427, "step": 13640 }, { "epoch": 0.37, "learning_rate": 1.4452445909091835e-05, "loss": 1.3696, "step": 13641 }, { "epoch": 0.37, "learning_rate": 1.4451653895984752e-05, "loss": 1.3081, "step": 13642 }, { "epoch": 0.37, "learning_rate": 1.4450861848050021e-05, "loss": 1.4255, "step": 13643 }, { "epoch": 0.37, "learning_rate": 1.4450069765293844e-05, "loss": 1.2781, "step": 13644 }, { "epoch": 0.37, "learning_rate": 1.4449277647722408e-05, "loss": 1.2998, "step": 13645 }, { "epoch": 0.37, "learning_rate": 1.444848549534192e-05, "loss": 1.2412, "step": 13646 }, { "epoch": 0.37, "learning_rate": 1.4447693308158572e-05, "loss": 1.075, "step": 13647 }, { "epoch": 0.37, "learning_rate": 1.4446901086178563e-05, "loss": 1.8198, "step": 13648 }, { "epoch": 0.37, "learning_rate": 1.444610882940809e-05, "loss": 1.7427, "step": 13649 }, { "epoch": 0.37, "learning_rate": 1.4445316537853356e-05, "loss": 1.311, "step": 13650 }, { "epoch": 0.37, "learning_rate": 1.4444524211520552e-05, "loss": 1.335, "step": 13651 }, { "epoch": 0.37, "learning_rate": 1.444373185041588e-05, "loss": 1.4287, "step": 13652 }, { "epoch": 0.37, "learning_rate": 1.4442939454545542e-05, "loss": 1.2405, "step": 13653 }, { "epoch": 0.37, "learning_rate": 1.4442147023915735e-05, "loss": 1.2786, "step": 13654 }, { "epoch": 0.37, "learning_rate": 1.4441354558532654e-05, "loss": 1.3293, "step": 13655 }, { "epoch": 0.37, "learning_rate": 1.444056205840251e-05, "loss": 1.1653, "step": 13656 }, { "epoch": 0.37, "learning_rate": 1.443976952353149e-05, "loss": 1.2073, "step": 13657 }, { "epoch": 0.37, "learning_rate": 1.4438976953925808e-05, "loss": 1.3572, "step": 13658 }, { "epoch": 0.37, "learning_rate": 1.443818434959165e-05, "loss": 1.3, "step": 13659 }, { "epoch": 0.37, "learning_rate": 1.4437391710535231e-05, "loss": 1.2366, "step": 13660 }, { "epoch": 0.37, "learning_rate": 1.4436599036762742e-05, "loss": 1.3076, "step": 13661 }, { "epoch": 0.37, "learning_rate": 1.4435806328280393e-05, "loss": 1.3425, "step": 13662 }, { "epoch": 0.37, "learning_rate": 1.4435013585094377e-05, "loss": 1.2478, "step": 13663 }, { "epoch": 0.37, "learning_rate": 1.44342208072109e-05, "loss": 1.2002, "step": 13664 }, { "epoch": 0.37, "learning_rate": 1.4433427994636167e-05, "loss": 1.3467, "step": 13665 }, { "epoch": 0.37, "learning_rate": 1.4432635147376378e-05, "loss": 1.3943, "step": 13666 }, { "epoch": 0.37, "learning_rate": 1.4431842265437731e-05, "loss": 1.2407, "step": 13667 }, { "epoch": 0.37, "learning_rate": 1.4431049348826442e-05, "loss": 1.2654, "step": 13668 }, { "epoch": 0.37, "learning_rate": 1.4430256397548701e-05, "loss": 1.2429, "step": 13669 }, { "epoch": 0.37, "learning_rate": 1.4429463411610718e-05, "loss": 1.4314, "step": 13670 }, { "epoch": 0.37, "learning_rate": 1.4428670391018695e-05, "loss": 1.3657, "step": 13671 }, { "epoch": 0.37, "learning_rate": 1.4427877335778841e-05, "loss": 1.303, "step": 13672 }, { "epoch": 0.37, "learning_rate": 1.4427084245897353e-05, "loss": 1.3323, "step": 13673 }, { "epoch": 0.37, "learning_rate": 1.4426291121380445e-05, "loss": 1.3167, "step": 13674 }, { "epoch": 0.37, "learning_rate": 1.4425497962234312e-05, "loss": 1.2937, "step": 13675 }, { "epoch": 0.37, "learning_rate": 1.4424704768465165e-05, "loss": 1.2881, "step": 13676 }, { "epoch": 0.37, "learning_rate": 1.442391154007921e-05, "loss": 1.3394, "step": 13677 }, { "epoch": 0.37, "learning_rate": 1.4423118277082651e-05, "loss": 1.416, "step": 13678 }, { "epoch": 0.37, "learning_rate": 1.4422324979481692e-05, "loss": 1.2166, "step": 13679 }, { "epoch": 0.37, "learning_rate": 1.4421531647282545e-05, "loss": 1.7329, "step": 13680 }, { "epoch": 0.37, "learning_rate": 1.4420738280491411e-05, "loss": 1.4155, "step": 13681 }, { "epoch": 0.37, "learning_rate": 1.4419944879114502e-05, "loss": 1.2407, "step": 13682 }, { "epoch": 0.37, "learning_rate": 1.441915144315802e-05, "loss": 1.2795, "step": 13683 }, { "epoch": 0.37, "learning_rate": 1.4418357972628179e-05, "loss": 1.4438, "step": 13684 }, { "epoch": 0.37, "learning_rate": 1.4417564467531178e-05, "loss": 1.2812, "step": 13685 }, { "epoch": 0.37, "learning_rate": 1.4416770927873232e-05, "loss": 1.4243, "step": 13686 }, { "epoch": 0.37, "learning_rate": 1.441597735366055e-05, "loss": 1.2983, "step": 13687 }, { "epoch": 0.37, "learning_rate": 1.4415183744899333e-05, "loss": 1.2629, "step": 13688 }, { "epoch": 0.37, "learning_rate": 1.4414390101595796e-05, "loss": 1.2725, "step": 13689 }, { "epoch": 0.37, "learning_rate": 1.441359642375615e-05, "loss": 1.4995, "step": 13690 }, { "epoch": 0.37, "learning_rate": 1.4412802711386598e-05, "loss": 1.4285, "step": 13691 }, { "epoch": 0.37, "learning_rate": 1.4412008964493351e-05, "loss": 1.4766, "step": 13692 }, { "epoch": 0.37, "learning_rate": 1.441121518308262e-05, "loss": 1.2, "step": 13693 }, { "epoch": 0.37, "learning_rate": 1.4410421367160621e-05, "loss": 1.3025, "step": 13694 }, { "epoch": 0.37, "learning_rate": 1.4409627516733555e-05, "loss": 1.3772, "step": 13695 }, { "epoch": 0.37, "learning_rate": 1.4408833631807639e-05, "loss": 1.3638, "step": 13696 }, { "epoch": 0.37, "learning_rate": 1.4408039712389081e-05, "loss": 1.2585, "step": 13697 }, { "epoch": 0.37, "learning_rate": 1.4407245758484094e-05, "loss": 1.3879, "step": 13698 }, { "epoch": 0.37, "learning_rate": 1.4406451770098885e-05, "loss": 1.3455, "step": 13699 }, { "epoch": 0.37, "learning_rate": 1.4405657747239675e-05, "loss": 1.3984, "step": 13700 }, { "epoch": 0.37, "learning_rate": 1.4404863689912668e-05, "loss": 1.3459, "step": 13701 }, { "epoch": 0.37, "learning_rate": 1.4404069598124078e-05, "loss": 1.3071, "step": 13702 }, { "epoch": 0.37, "learning_rate": 1.4403275471880118e-05, "loss": 1.3293, "step": 13703 }, { "epoch": 0.37, "learning_rate": 1.4402481311187002e-05, "loss": 1.3936, "step": 13704 }, { "epoch": 0.37, "learning_rate": 1.4401687116050945e-05, "loss": 1.4492, "step": 13705 }, { "epoch": 0.37, "learning_rate": 1.4400892886478153e-05, "loss": 1.4058, "step": 13706 }, { "epoch": 0.37, "learning_rate": 1.4400098622474847e-05, "loss": 1.188, "step": 13707 }, { "epoch": 0.37, "learning_rate": 1.4399304324047237e-05, "loss": 1.3467, "step": 13708 }, { "epoch": 0.37, "learning_rate": 1.4398509991201542e-05, "loss": 1.2256, "step": 13709 }, { "epoch": 0.37, "learning_rate": 1.4397715623943968e-05, "loss": 1.3977, "step": 13710 }, { "epoch": 0.37, "learning_rate": 1.439692122228074e-05, "loss": 1.3391, "step": 13711 }, { "epoch": 0.37, "learning_rate": 1.4396126786218066e-05, "loss": 1.2107, "step": 13712 }, { "epoch": 0.37, "learning_rate": 1.4395332315762165e-05, "loss": 1.7588, "step": 13713 }, { "epoch": 0.37, "learning_rate": 1.4394537810919247e-05, "loss": 1.3181, "step": 13714 }, { "epoch": 0.37, "learning_rate": 1.4393743271695535e-05, "loss": 1.405, "step": 13715 }, { "epoch": 0.37, "learning_rate": 1.439294869809724e-05, "loss": 1.7446, "step": 13716 }, { "epoch": 0.37, "learning_rate": 1.4392154090130579e-05, "loss": 1.2461, "step": 13717 }, { "epoch": 0.37, "learning_rate": 1.439135944780177e-05, "loss": 1.4062, "step": 13718 }, { "epoch": 0.37, "learning_rate": 1.4390564771117032e-05, "loss": 1.3779, "step": 13719 }, { "epoch": 0.37, "learning_rate": 1.4389770060082578e-05, "loss": 1.373, "step": 13720 }, { "epoch": 0.37, "learning_rate": 1.438897531470463e-05, "loss": 1.3672, "step": 13721 }, { "epoch": 0.37, "learning_rate": 1.43881805349894e-05, "loss": 1.3496, "step": 13722 }, { "epoch": 0.37, "learning_rate": 1.438738572094311e-05, "loss": 1.3613, "step": 13723 }, { "epoch": 0.37, "learning_rate": 1.4386590872571975e-05, "loss": 1.3804, "step": 13724 }, { "epoch": 0.37, "learning_rate": 1.4385795989882221e-05, "loss": 1.4946, "step": 13725 }, { "epoch": 0.37, "learning_rate": 1.4385001072880056e-05, "loss": 1.1843, "step": 13726 }, { "epoch": 0.37, "learning_rate": 1.4384206121571708e-05, "loss": 1.2573, "step": 13727 }, { "epoch": 0.37, "learning_rate": 1.438341113596339e-05, "loss": 1.3186, "step": 13728 }, { "epoch": 0.37, "learning_rate": 1.4382616116061327e-05, "loss": 1.4314, "step": 13729 }, { "epoch": 0.37, "learning_rate": 1.4381821061871738e-05, "loss": 1.3296, "step": 13730 }, { "epoch": 0.37, "learning_rate": 1.4381025973400839e-05, "loss": 1.3521, "step": 13731 }, { "epoch": 0.38, "learning_rate": 1.4380230850654849e-05, "loss": 1.4473, "step": 13732 }, { "epoch": 0.38, "learning_rate": 1.4379435693639997e-05, "loss": 1.1631, "step": 13733 }, { "epoch": 0.38, "learning_rate": 1.43786405023625e-05, "loss": 1.1719, "step": 13734 }, { "epoch": 0.38, "learning_rate": 1.4377845276828576e-05, "loss": 1.325, "step": 13735 }, { "epoch": 0.38, "learning_rate": 1.437705001704445e-05, "loss": 1.155, "step": 13736 }, { "epoch": 0.38, "learning_rate": 1.4376254723016347e-05, "loss": 1.188, "step": 13737 }, { "epoch": 0.38, "learning_rate": 1.4375459394750482e-05, "loss": 1.4187, "step": 13738 }, { "epoch": 0.38, "learning_rate": 1.4374664032253081e-05, "loss": 1.7314, "step": 13739 }, { "epoch": 0.38, "learning_rate": 1.4373868635530364e-05, "loss": 1.3794, "step": 13740 }, { "epoch": 0.38, "learning_rate": 1.4373073204588556e-05, "loss": 1.3379, "step": 13741 }, { "epoch": 0.38, "learning_rate": 1.4372277739433878e-05, "loss": 1.124, "step": 13742 }, { "epoch": 0.38, "learning_rate": 1.4371482240072558e-05, "loss": 1.5393, "step": 13743 }, { "epoch": 0.38, "learning_rate": 1.4370686706510814e-05, "loss": 1.3638, "step": 13744 }, { "epoch": 0.38, "learning_rate": 1.4369891138754874e-05, "loss": 1.3501, "step": 13745 }, { "epoch": 0.38, "learning_rate": 1.4369095536810961e-05, "loss": 1.3296, "step": 13746 }, { "epoch": 0.38, "learning_rate": 1.4368299900685298e-05, "loss": 1.3267, "step": 13747 }, { "epoch": 0.38, "learning_rate": 1.436750423038411e-05, "loss": 1.4412, "step": 13748 }, { "epoch": 0.38, "learning_rate": 1.4366708525913624e-05, "loss": 1.4429, "step": 13749 }, { "epoch": 0.38, "learning_rate": 1.4365912787280065e-05, "loss": 1.4172, "step": 13750 }, { "epoch": 0.38, "learning_rate": 1.4365117014489656e-05, "loss": 1.3545, "step": 13751 }, { "epoch": 0.38, "learning_rate": 1.4364321207548623e-05, "loss": 1.304, "step": 13752 }, { "epoch": 0.38, "learning_rate": 1.4363525366463193e-05, "loss": 1.3955, "step": 13753 }, { "epoch": 0.38, "learning_rate": 1.4362729491239595e-05, "loss": 1.3877, "step": 13754 }, { "epoch": 0.38, "learning_rate": 1.4361933581884051e-05, "loss": 1.1675, "step": 13755 }, { "epoch": 0.38, "learning_rate": 1.4361137638402791e-05, "loss": 1.4692, "step": 13756 }, { "epoch": 0.38, "learning_rate": 1.436034166080204e-05, "loss": 1.1412, "step": 13757 }, { "epoch": 0.38, "learning_rate": 1.4359545649088027e-05, "loss": 1.3105, "step": 13758 }, { "epoch": 0.38, "learning_rate": 1.4358749603266978e-05, "loss": 1.3469, "step": 13759 }, { "epoch": 0.38, "learning_rate": 1.4357953523345122e-05, "loss": 1.1047, "step": 13760 }, { "epoch": 0.38, "learning_rate": 1.4357157409328686e-05, "loss": 1.4409, "step": 13761 }, { "epoch": 0.38, "learning_rate": 1.43563612612239e-05, "loss": 1.1399, "step": 13762 }, { "epoch": 0.38, "learning_rate": 1.4355565079036991e-05, "loss": 1.4795, "step": 13763 }, { "epoch": 0.38, "learning_rate": 1.4354768862774192e-05, "loss": 1.3782, "step": 13764 }, { "epoch": 0.38, "learning_rate": 1.4353972612441726e-05, "loss": 1.2966, "step": 13765 }, { "epoch": 0.38, "learning_rate": 1.4353176328045828e-05, "loss": 1.3179, "step": 13766 }, { "epoch": 0.38, "learning_rate": 1.4352380009592723e-05, "loss": 1.3782, "step": 13767 }, { "epoch": 0.38, "learning_rate": 1.4351583657088647e-05, "loss": 1.3635, "step": 13768 }, { "epoch": 0.38, "learning_rate": 1.4350787270539824e-05, "loss": 1.1372, "step": 13769 }, { "epoch": 0.38, "learning_rate": 1.4349990849952486e-05, "loss": 1.4431, "step": 13770 }, { "epoch": 0.38, "learning_rate": 1.4349194395332869e-05, "loss": 1.3164, "step": 13771 }, { "epoch": 0.38, "learning_rate": 1.4348397906687197e-05, "loss": 1.4517, "step": 13772 }, { "epoch": 0.38, "learning_rate": 1.4347601384021705e-05, "loss": 1.2571, "step": 13773 }, { "epoch": 0.38, "learning_rate": 1.4346804827342627e-05, "loss": 1.4382, "step": 13774 }, { "epoch": 0.38, "learning_rate": 1.4346008236656189e-05, "loss": 1.3066, "step": 13775 }, { "epoch": 0.38, "learning_rate": 1.4345211611968627e-05, "loss": 1.3083, "step": 13776 }, { "epoch": 0.38, "learning_rate": 1.4344414953286172e-05, "loss": 1.4814, "step": 13777 }, { "epoch": 0.38, "learning_rate": 1.434361826061506e-05, "loss": 1.1404, "step": 13778 }, { "epoch": 0.38, "learning_rate": 1.4342821533961515e-05, "loss": 1.3884, "step": 13779 }, { "epoch": 0.38, "learning_rate": 1.4342024773331782e-05, "loss": 1.3237, "step": 13780 }, { "epoch": 0.38, "learning_rate": 1.4341227978732086e-05, "loss": 1.5298, "step": 13781 }, { "epoch": 0.38, "learning_rate": 1.4340431150168668e-05, "loss": 1.4023, "step": 13782 }, { "epoch": 0.38, "learning_rate": 1.4339634287647753e-05, "loss": 1.3462, "step": 13783 }, { "epoch": 0.38, "learning_rate": 1.4338837391175582e-05, "loss": 1.3174, "step": 13784 }, { "epoch": 0.38, "learning_rate": 1.4338040460758386e-05, "loss": 1.4287, "step": 13785 }, { "epoch": 0.38, "learning_rate": 1.4337243496402405e-05, "loss": 1.3042, "step": 13786 }, { "epoch": 0.38, "learning_rate": 1.4336446498113867e-05, "loss": 1.438, "step": 13787 }, { "epoch": 0.38, "learning_rate": 1.4335649465899013e-05, "loss": 1.3259, "step": 13788 }, { "epoch": 0.38, "learning_rate": 1.4334852399764075e-05, "loss": 1.4927, "step": 13789 }, { "epoch": 0.38, "learning_rate": 1.433405529971529e-05, "loss": 1.4475, "step": 13790 }, { "epoch": 0.38, "learning_rate": 1.4333258165758893e-05, "loss": 1.3804, "step": 13791 }, { "epoch": 0.38, "learning_rate": 1.4332460997901127e-05, "loss": 1.3586, "step": 13792 }, { "epoch": 0.38, "learning_rate": 1.4331663796148218e-05, "loss": 1.3027, "step": 13793 }, { "epoch": 0.38, "learning_rate": 1.433086656050641e-05, "loss": 1.3569, "step": 13794 }, { "epoch": 0.38, "learning_rate": 1.433006929098194e-05, "loss": 1.2764, "step": 13795 }, { "epoch": 0.38, "learning_rate": 1.4329271987581042e-05, "loss": 1.438, "step": 13796 }, { "epoch": 0.38, "learning_rate": 1.4328474650309958e-05, "loss": 1.498, "step": 13797 }, { "epoch": 0.38, "learning_rate": 1.4327677279174921e-05, "loss": 1.3311, "step": 13798 }, { "epoch": 0.38, "learning_rate": 1.4326879874182175e-05, "loss": 1.3977, "step": 13799 }, { "epoch": 0.38, "learning_rate": 1.432608243533795e-05, "loss": 1.3901, "step": 13800 }, { "epoch": 0.38, "learning_rate": 1.4325284962648499e-05, "loss": 1.4932, "step": 13801 }, { "epoch": 0.38, "learning_rate": 1.4324487456120045e-05, "loss": 1.1333, "step": 13802 }, { "epoch": 0.38, "learning_rate": 1.4323689915758839e-05, "loss": 1.4055, "step": 13803 }, { "epoch": 0.38, "learning_rate": 1.4322892341571113e-05, "loss": 1.3726, "step": 13804 }, { "epoch": 0.38, "learning_rate": 1.4322094733563112e-05, "loss": 1.3687, "step": 13805 }, { "epoch": 0.38, "learning_rate": 1.4321297091741073e-05, "loss": 1.1399, "step": 13806 }, { "epoch": 0.38, "learning_rate": 1.4320499416111239e-05, "loss": 1.3689, "step": 13807 }, { "epoch": 0.38, "learning_rate": 1.4319701706679848e-05, "loss": 1.1394, "step": 13808 }, { "epoch": 0.38, "learning_rate": 1.4318903963453141e-05, "loss": 1.3315, "step": 13809 }, { "epoch": 0.38, "learning_rate": 1.4318106186437362e-05, "loss": 1.3918, "step": 13810 }, { "epoch": 0.38, "learning_rate": 1.4317308375638752e-05, "loss": 1.3784, "step": 13811 }, { "epoch": 0.38, "learning_rate": 1.4316510531063547e-05, "loss": 1.4331, "step": 13812 }, { "epoch": 0.38, "learning_rate": 1.4315712652717999e-05, "loss": 1.3103, "step": 13813 }, { "epoch": 0.38, "learning_rate": 1.431491474060834e-05, "loss": 1.1335, "step": 13814 }, { "epoch": 0.38, "learning_rate": 1.431411679474082e-05, "loss": 1.1971, "step": 13815 }, { "epoch": 0.38, "learning_rate": 1.4313318815121677e-05, "loss": 1.2139, "step": 13816 }, { "epoch": 0.38, "learning_rate": 1.4312520801757158e-05, "loss": 1.1594, "step": 13817 }, { "epoch": 0.38, "learning_rate": 1.4311722754653504e-05, "loss": 1.416, "step": 13818 }, { "epoch": 0.38, "learning_rate": 1.4310924673816957e-05, "loss": 1.2014, "step": 13819 }, { "epoch": 0.38, "learning_rate": 1.431012655925376e-05, "loss": 1.3257, "step": 13820 }, { "epoch": 0.38, "learning_rate": 1.4309328410970164e-05, "loss": 1.3118, "step": 13821 }, { "epoch": 0.38, "learning_rate": 1.4308530228972408e-05, "loss": 1.2651, "step": 13822 }, { "epoch": 0.38, "learning_rate": 1.4307732013266738e-05, "loss": 1.4707, "step": 13823 }, { "epoch": 0.38, "learning_rate": 1.4306933763859396e-05, "loss": 1.2312, "step": 13824 }, { "epoch": 0.38, "learning_rate": 1.4306135480756628e-05, "loss": 1.1631, "step": 13825 }, { "epoch": 0.38, "learning_rate": 1.4305337163964685e-05, "loss": 1.3552, "step": 13826 }, { "epoch": 0.38, "learning_rate": 1.4304538813489808e-05, "loss": 1.3354, "step": 13827 }, { "epoch": 0.38, "learning_rate": 1.4303740429338242e-05, "loss": 1.2256, "step": 13828 }, { "epoch": 0.38, "learning_rate": 1.4302942011516236e-05, "loss": 1.3877, "step": 13829 }, { "epoch": 0.38, "learning_rate": 1.4302143560030035e-05, "loss": 1.3494, "step": 13830 }, { "epoch": 0.38, "learning_rate": 1.4301345074885884e-05, "loss": 1.071, "step": 13831 }, { "epoch": 0.38, "learning_rate": 1.4300546556090034e-05, "loss": 1.4944, "step": 13832 }, { "epoch": 0.38, "learning_rate": 1.4299748003648731e-05, "loss": 1.2615, "step": 13833 }, { "epoch": 0.38, "learning_rate": 1.4298949417568217e-05, "loss": 1.2842, "step": 13834 }, { "epoch": 0.38, "learning_rate": 1.429815079785475e-05, "loss": 1.2903, "step": 13835 }, { "epoch": 0.38, "learning_rate": 1.4297352144514566e-05, "loss": 1.3525, "step": 13836 }, { "epoch": 0.38, "learning_rate": 1.4296553457553923e-05, "loss": 1.386, "step": 13837 }, { "epoch": 0.38, "learning_rate": 1.4295754736979066e-05, "loss": 1.2886, "step": 13838 }, { "epoch": 0.38, "learning_rate": 1.4294955982796243e-05, "loss": 1.4087, "step": 13839 }, { "epoch": 0.38, "learning_rate": 1.4294157195011704e-05, "loss": 1.2336, "step": 13840 }, { "epoch": 0.38, "learning_rate": 1.4293358373631701e-05, "loss": 1.3093, "step": 13841 }, { "epoch": 0.38, "learning_rate": 1.4292559518662477e-05, "loss": 1.5923, "step": 13842 }, { "epoch": 0.38, "learning_rate": 1.429176063011029e-05, "loss": 1.8447, "step": 13843 }, { "epoch": 0.38, "learning_rate": 1.4290961707981382e-05, "loss": 1.239, "step": 13844 }, { "epoch": 0.38, "learning_rate": 1.429016275228201e-05, "loss": 1.4548, "step": 13845 }, { "epoch": 0.38, "learning_rate": 1.428936376301842e-05, "loss": 1.4333, "step": 13846 }, { "epoch": 0.38, "learning_rate": 1.4288564740196869e-05, "loss": 1.3967, "step": 13847 }, { "epoch": 0.38, "learning_rate": 1.4287765683823598e-05, "loss": 1.1543, "step": 13848 }, { "epoch": 0.38, "learning_rate": 1.428696659390487e-05, "loss": 1.2422, "step": 13849 }, { "epoch": 0.38, "learning_rate": 1.4286167470446927e-05, "loss": 1.3909, "step": 13850 }, { "epoch": 0.38, "learning_rate": 1.428536831345603e-05, "loss": 1.1658, "step": 13851 }, { "epoch": 0.38, "learning_rate": 1.428456912293842e-05, "loss": 1.3225, "step": 13852 }, { "epoch": 0.38, "learning_rate": 1.4283769898900362e-05, "loss": 1.2375, "step": 13853 }, { "epoch": 0.38, "learning_rate": 1.42829706413481e-05, "loss": 1.3208, "step": 13854 }, { "epoch": 0.38, "learning_rate": 1.428217135028789e-05, "loss": 1.3403, "step": 13855 }, { "epoch": 0.38, "learning_rate": 1.4281372025725983e-05, "loss": 1.2305, "step": 13856 }, { "epoch": 0.38, "learning_rate": 1.4280572667668637e-05, "loss": 1.2332, "step": 13857 }, { "epoch": 0.38, "learning_rate": 1.4279773276122105e-05, "loss": 1.2837, "step": 13858 }, { "epoch": 0.38, "learning_rate": 1.4278973851092635e-05, "loss": 1.363, "step": 13859 }, { "epoch": 0.38, "learning_rate": 1.4278174392586488e-05, "loss": 1.2646, "step": 13860 }, { "epoch": 0.38, "learning_rate": 1.4277374900609914e-05, "loss": 1.3101, "step": 13861 }, { "epoch": 0.38, "learning_rate": 1.4276575375169174e-05, "loss": 1.4719, "step": 13862 }, { "epoch": 0.38, "learning_rate": 1.4275775816270518e-05, "loss": 1.3411, "step": 13863 }, { "epoch": 0.38, "learning_rate": 1.4274976223920203e-05, "loss": 1.5215, "step": 13864 }, { "epoch": 0.38, "learning_rate": 1.4274176598124483e-05, "loss": 1.2737, "step": 13865 }, { "epoch": 0.38, "learning_rate": 1.4273376938889615e-05, "loss": 1.2957, "step": 13866 }, { "epoch": 0.38, "learning_rate": 1.4272577246221858e-05, "loss": 1.209, "step": 13867 }, { "epoch": 0.38, "learning_rate": 1.4271777520127464e-05, "loss": 1.3547, "step": 13868 }, { "epoch": 0.38, "learning_rate": 1.427097776061269e-05, "loss": 1.4258, "step": 13869 }, { "epoch": 0.38, "learning_rate": 1.4270177967683797e-05, "loss": 1.2185, "step": 13870 }, { "epoch": 0.38, "learning_rate": 1.4269378141347035e-05, "loss": 1.3391, "step": 13871 }, { "epoch": 0.38, "learning_rate": 1.4268578281608669e-05, "loss": 1.4683, "step": 13872 }, { "epoch": 0.38, "learning_rate": 1.4267778388474953e-05, "loss": 1.4705, "step": 13873 }, { "epoch": 0.38, "learning_rate": 1.4266978461952148e-05, "loss": 1.2854, "step": 13874 }, { "epoch": 0.38, "learning_rate": 1.4266178502046506e-05, "loss": 1.3496, "step": 13875 }, { "epoch": 0.38, "learning_rate": 1.4265378508764294e-05, "loss": 1.3745, "step": 13876 }, { "epoch": 0.38, "learning_rate": 1.4264578482111762e-05, "loss": 1.3082, "step": 13877 }, { "epoch": 0.38, "learning_rate": 1.4263778422095178e-05, "loss": 1.3623, "step": 13878 }, { "epoch": 0.38, "learning_rate": 1.4262978328720794e-05, "loss": 1.438, "step": 13879 }, { "epoch": 0.38, "learning_rate": 1.4262178201994871e-05, "loss": 1.3303, "step": 13880 }, { "epoch": 0.38, "learning_rate": 1.4261378041923672e-05, "loss": 1.3164, "step": 13881 }, { "epoch": 0.38, "learning_rate": 1.4260577848513455e-05, "loss": 1.2581, "step": 13882 }, { "epoch": 0.38, "learning_rate": 1.4259777621770478e-05, "loss": 1.304, "step": 13883 }, { "epoch": 0.38, "learning_rate": 1.4258977361701008e-05, "loss": 1.2383, "step": 13884 }, { "epoch": 0.38, "learning_rate": 1.4258177068311297e-05, "loss": 1.2759, "step": 13885 }, { "epoch": 0.38, "learning_rate": 1.4257376741607616e-05, "loss": 1.3501, "step": 13886 }, { "epoch": 0.38, "learning_rate": 1.4256576381596216e-05, "loss": 1.3696, "step": 13887 }, { "epoch": 0.38, "learning_rate": 1.4255775988283367e-05, "loss": 1.3137, "step": 13888 }, { "epoch": 0.38, "learning_rate": 1.4254975561675326e-05, "loss": 1.2346, "step": 13889 }, { "epoch": 0.38, "learning_rate": 1.425417510177836e-05, "loss": 1.2253, "step": 13890 }, { "epoch": 0.38, "learning_rate": 1.4253374608598726e-05, "loss": 1.373, "step": 13891 }, { "epoch": 0.38, "learning_rate": 1.4252574082142692e-05, "loss": 1.3103, "step": 13892 }, { "epoch": 0.38, "learning_rate": 1.4251773522416514e-05, "loss": 1.2793, "step": 13893 }, { "epoch": 0.38, "learning_rate": 1.4250972929426462e-05, "loss": 1.2041, "step": 13894 }, { "epoch": 0.38, "learning_rate": 1.4250172303178797e-05, "loss": 1.4519, "step": 13895 }, { "epoch": 0.38, "learning_rate": 1.4249371643679783e-05, "loss": 1.2986, "step": 13896 }, { "epoch": 0.38, "learning_rate": 1.4248570950935681e-05, "loss": 1.2739, "step": 13897 }, { "epoch": 0.38, "learning_rate": 1.4247770224952761e-05, "loss": 1.3384, "step": 13898 }, { "epoch": 0.38, "learning_rate": 1.424696946573728e-05, "loss": 1.2859, "step": 13899 }, { "epoch": 0.38, "learning_rate": 1.424616867329551e-05, "loss": 1.387, "step": 13900 }, { "epoch": 0.38, "learning_rate": 1.4245367847633711e-05, "loss": 1.2603, "step": 13901 }, { "epoch": 0.38, "learning_rate": 1.4244566988758152e-05, "loss": 1.2505, "step": 13902 }, { "epoch": 0.38, "learning_rate": 1.4243766096675095e-05, "loss": 1.3767, "step": 13903 }, { "epoch": 0.38, "learning_rate": 1.424296517139081e-05, "loss": 1.2764, "step": 13904 }, { "epoch": 0.38, "learning_rate": 1.424216421291156e-05, "loss": 1.53, "step": 13905 }, { "epoch": 0.38, "learning_rate": 1.4241363221243611e-05, "loss": 1.2915, "step": 13906 }, { "epoch": 0.38, "learning_rate": 1.424056219639323e-05, "loss": 1.2605, "step": 13907 }, { "epoch": 0.38, "learning_rate": 1.4239761138366688e-05, "loss": 1.1826, "step": 13908 }, { "epoch": 0.38, "learning_rate": 1.4238960047170244e-05, "loss": 1.354, "step": 13909 }, { "epoch": 0.38, "learning_rate": 1.4238158922810172e-05, "loss": 1.2134, "step": 13910 }, { "epoch": 0.38, "learning_rate": 1.4237357765292739e-05, "loss": 1.3428, "step": 13911 }, { "epoch": 0.38, "learning_rate": 1.423655657462421e-05, "loss": 1.3831, "step": 13912 }, { "epoch": 0.38, "learning_rate": 1.4235755350810854e-05, "loss": 1.3296, "step": 13913 }, { "epoch": 0.38, "learning_rate": 1.423495409385894e-05, "loss": 1.2847, "step": 13914 }, { "epoch": 0.38, "learning_rate": 1.4234152803774736e-05, "loss": 1.2007, "step": 13915 }, { "epoch": 0.38, "learning_rate": 1.4233351480564515e-05, "loss": 1.3601, "step": 13916 }, { "epoch": 0.38, "learning_rate": 1.4232550124234539e-05, "loss": 1.2344, "step": 13917 }, { "epoch": 0.38, "learning_rate": 1.4231748734791083e-05, "loss": 1.2683, "step": 13918 }, { "epoch": 0.38, "learning_rate": 1.4230947312240413e-05, "loss": 1.2896, "step": 13919 }, { "epoch": 0.38, "learning_rate": 1.42301458565888e-05, "loss": 1.3223, "step": 13920 }, { "epoch": 0.38, "learning_rate": 1.4229344367842517e-05, "loss": 1.3484, "step": 13921 }, { "epoch": 0.38, "learning_rate": 1.4228542846007832e-05, "loss": 1.4443, "step": 13922 }, { "epoch": 0.38, "learning_rate": 1.4227741291091017e-05, "loss": 1.3669, "step": 13923 }, { "epoch": 0.38, "learning_rate": 1.4226939703098342e-05, "loss": 1.1127, "step": 13924 }, { "epoch": 0.38, "learning_rate": 1.4226138082036078e-05, "loss": 1.3008, "step": 13925 }, { "epoch": 0.38, "learning_rate": 1.4225336427910494e-05, "loss": 1.3091, "step": 13926 }, { "epoch": 0.38, "learning_rate": 1.4224534740727868e-05, "loss": 1.4053, "step": 13927 }, { "epoch": 0.38, "learning_rate": 1.422373302049447e-05, "loss": 1.3086, "step": 13928 }, { "epoch": 0.38, "learning_rate": 1.4222931267216571e-05, "loss": 1.4009, "step": 13929 }, { "epoch": 0.38, "learning_rate": 1.422212948090044e-05, "loss": 1.2773, "step": 13930 }, { "epoch": 0.38, "learning_rate": 1.4221327661552355e-05, "loss": 1.3174, "step": 13931 }, { "epoch": 0.38, "learning_rate": 1.4220525809178586e-05, "loss": 1.3372, "step": 13932 }, { "epoch": 0.38, "learning_rate": 1.4219723923785411e-05, "loss": 1.4575, "step": 13933 }, { "epoch": 0.38, "learning_rate": 1.4218922005379097e-05, "loss": 1.4534, "step": 13934 }, { "epoch": 0.38, "learning_rate": 1.4218120053965923e-05, "loss": 1.387, "step": 13935 }, { "epoch": 0.38, "learning_rate": 1.421731806955216e-05, "loss": 1.353, "step": 13936 }, { "epoch": 0.38, "learning_rate": 1.4216516052144084e-05, "loss": 1.2375, "step": 13937 }, { "epoch": 0.38, "learning_rate": 1.421571400174797e-05, "loss": 1.3396, "step": 13938 }, { "epoch": 0.38, "learning_rate": 1.4214911918370091e-05, "loss": 1.2632, "step": 13939 }, { "epoch": 0.38, "learning_rate": 1.4214109802016722e-05, "loss": 1.1609, "step": 13940 }, { "epoch": 0.38, "learning_rate": 1.4213307652694144e-05, "loss": 1.217, "step": 13941 }, { "epoch": 0.38, "learning_rate": 1.4212505470408624e-05, "loss": 1.4033, "step": 13942 }, { "epoch": 0.38, "learning_rate": 1.4211703255166444e-05, "loss": 1.2898, "step": 13943 }, { "epoch": 0.38, "learning_rate": 1.4210901006973876e-05, "loss": 1.2312, "step": 13944 }, { "epoch": 0.38, "learning_rate": 1.4210098725837202e-05, "loss": 1.3318, "step": 13945 }, { "epoch": 0.38, "learning_rate": 1.4209296411762692e-05, "loss": 1.4775, "step": 13946 }, { "epoch": 0.38, "learning_rate": 1.4208494064756627e-05, "loss": 1.2878, "step": 13947 }, { "epoch": 0.38, "learning_rate": 1.4207691684825284e-05, "loss": 1.3394, "step": 13948 }, { "epoch": 0.38, "learning_rate": 1.4206889271974942e-05, "loss": 1.6816, "step": 13949 }, { "epoch": 0.38, "learning_rate": 1.4206086826211874e-05, "loss": 1.6187, "step": 13950 }, { "epoch": 0.38, "learning_rate": 1.4205284347542359e-05, "loss": 1.374, "step": 13951 }, { "epoch": 0.38, "learning_rate": 1.4204481835972681e-05, "loss": 1.334, "step": 13952 }, { "epoch": 0.38, "learning_rate": 1.4203679291509111e-05, "loss": 1.438, "step": 13953 }, { "epoch": 0.38, "learning_rate": 1.4202876714157934e-05, "loss": 1.3369, "step": 13954 }, { "epoch": 0.38, "learning_rate": 1.4202074103925421e-05, "loss": 1.1724, "step": 13955 }, { "epoch": 0.38, "learning_rate": 1.420127146081786e-05, "loss": 1.3267, "step": 13956 }, { "epoch": 0.38, "learning_rate": 1.4200468784841526e-05, "loss": 1.272, "step": 13957 }, { "epoch": 0.38, "learning_rate": 1.4199666076002699e-05, "loss": 1.3931, "step": 13958 }, { "epoch": 0.38, "learning_rate": 1.4198863334307658e-05, "loss": 1.3108, "step": 13959 }, { "epoch": 0.38, "learning_rate": 1.4198060559762685e-05, "loss": 1.2791, "step": 13960 }, { "epoch": 0.38, "learning_rate": 1.4197257752374062e-05, "loss": 1.2886, "step": 13961 }, { "epoch": 0.38, "learning_rate": 1.4196454912148068e-05, "loss": 1.3516, "step": 13962 }, { "epoch": 0.38, "learning_rate": 1.4195652039090986e-05, "loss": 1.4038, "step": 13963 }, { "epoch": 0.38, "learning_rate": 1.419484913320909e-05, "loss": 1.4309, "step": 13964 }, { "epoch": 0.38, "learning_rate": 1.419404619450867e-05, "loss": 1.3455, "step": 13965 }, { "epoch": 0.38, "learning_rate": 1.4193243222996005e-05, "loss": 1.2324, "step": 13966 }, { "epoch": 0.38, "learning_rate": 1.4192440218677377e-05, "loss": 1.2744, "step": 13967 }, { "epoch": 0.38, "learning_rate": 1.4191637181559069e-05, "loss": 1.4001, "step": 13968 }, { "epoch": 0.38, "learning_rate": 1.4190834111647358e-05, "loss": 1.3015, "step": 13969 }, { "epoch": 0.38, "learning_rate": 1.4190031008948537e-05, "loss": 1.3069, "step": 13970 }, { "epoch": 0.38, "learning_rate": 1.4189227873468881e-05, "loss": 1.3887, "step": 13971 }, { "epoch": 0.38, "learning_rate": 1.4188424705214679e-05, "loss": 1.3748, "step": 13972 }, { "epoch": 0.38, "learning_rate": 1.4187621504192208e-05, "loss": 1.2773, "step": 13973 }, { "epoch": 0.38, "learning_rate": 1.4186818270407756e-05, "loss": 1.3201, "step": 13974 }, { "epoch": 0.38, "learning_rate": 1.4186015003867609e-05, "loss": 1.2722, "step": 13975 }, { "epoch": 0.38, "learning_rate": 1.4185211704578046e-05, "loss": 1.3306, "step": 13976 }, { "epoch": 0.38, "learning_rate": 1.4184408372545356e-05, "loss": 1.1536, "step": 13977 }, { "epoch": 0.38, "learning_rate": 1.4183605007775825e-05, "loss": 1.3311, "step": 13978 }, { "epoch": 0.38, "learning_rate": 1.4182801610275731e-05, "loss": 1.1233, "step": 13979 }, { "epoch": 0.38, "learning_rate": 1.4181998180051368e-05, "loss": 1.4319, "step": 13980 }, { "epoch": 0.38, "learning_rate": 1.4181194717109012e-05, "loss": 1.4248, "step": 13981 }, { "epoch": 0.38, "learning_rate": 1.4180391221454961e-05, "loss": 1.3706, "step": 13982 }, { "epoch": 0.38, "learning_rate": 1.4179587693095492e-05, "loss": 1.321, "step": 13983 }, { "epoch": 0.38, "learning_rate": 1.4178784132036895e-05, "loss": 1.3921, "step": 13984 }, { "epoch": 0.38, "learning_rate": 1.4177980538285456e-05, "loss": 1.3716, "step": 13985 }, { "epoch": 0.38, "learning_rate": 1.4177176911847461e-05, "loss": 1.2996, "step": 13986 }, { "epoch": 0.38, "learning_rate": 1.4176373252729198e-05, "loss": 1.2908, "step": 13987 }, { "epoch": 0.38, "learning_rate": 1.4175569560936956e-05, "loss": 1.1418, "step": 13988 }, { "epoch": 0.38, "learning_rate": 1.417476583647702e-05, "loss": 1.4788, "step": 13989 }, { "epoch": 0.38, "learning_rate": 1.4173962079355684e-05, "loss": 1.4521, "step": 13990 }, { "epoch": 0.38, "learning_rate": 1.4173158289579225e-05, "loss": 1.314, "step": 13991 }, { "epoch": 0.38, "learning_rate": 1.4172354467153942e-05, "loss": 1.1689, "step": 13992 }, { "epoch": 0.38, "learning_rate": 1.4171550612086116e-05, "loss": 1.3672, "step": 13993 }, { "epoch": 0.38, "learning_rate": 1.4170746724382043e-05, "loss": 1.2903, "step": 13994 }, { "epoch": 0.38, "learning_rate": 1.4169942804048007e-05, "loss": 1.3337, "step": 13995 }, { "epoch": 0.38, "learning_rate": 1.4169138851090298e-05, "loss": 1.3279, "step": 13996 }, { "epoch": 0.38, "learning_rate": 1.4168334865515207e-05, "loss": 1.3533, "step": 13997 }, { "epoch": 0.38, "learning_rate": 1.4167530847329027e-05, "loss": 1.4037, "step": 13998 }, { "epoch": 0.38, "learning_rate": 1.4166726796538044e-05, "loss": 1.2153, "step": 13999 }, { "epoch": 0.38, "learning_rate": 1.4165922713148549e-05, "loss": 1.2617, "step": 14000 }, { "epoch": 0.38, "learning_rate": 1.4165118597166836e-05, "loss": 1.3193, "step": 14001 }, { "epoch": 0.38, "learning_rate": 1.4164314448599192e-05, "loss": 1.3723, "step": 14002 }, { "epoch": 0.38, "learning_rate": 1.416351026745191e-05, "loss": 1.3296, "step": 14003 }, { "epoch": 0.38, "learning_rate": 1.4162706053731283e-05, "loss": 1.325, "step": 14004 }, { "epoch": 0.38, "learning_rate": 1.4161901807443598e-05, "loss": 1.2568, "step": 14005 }, { "epoch": 0.38, "learning_rate": 1.4161097528595155e-05, "loss": 1.3506, "step": 14006 }, { "epoch": 0.38, "learning_rate": 1.4160293217192238e-05, "loss": 1.1913, "step": 14007 }, { "epoch": 0.38, "learning_rate": 1.4159488873241146e-05, "loss": 1.4172, "step": 14008 }, { "epoch": 0.38, "learning_rate": 1.4158684496748166e-05, "loss": 1.3601, "step": 14009 }, { "epoch": 0.38, "learning_rate": 1.4157880087719595e-05, "loss": 1.2461, "step": 14010 }, { "epoch": 0.38, "learning_rate": 1.4157075646161727e-05, "loss": 1.2273, "step": 14011 }, { "epoch": 0.38, "learning_rate": 1.4156271172080851e-05, "loss": 1.3293, "step": 14012 }, { "epoch": 0.38, "learning_rate": 1.4155466665483267e-05, "loss": 1.325, "step": 14013 }, { "epoch": 0.38, "learning_rate": 1.4154662126375262e-05, "loss": 1.2852, "step": 14014 }, { "epoch": 0.38, "learning_rate": 1.4153857554763137e-05, "loss": 1.2729, "step": 14015 }, { "epoch": 0.38, "learning_rate": 1.4153052950653183e-05, "loss": 1.4199, "step": 14016 }, { "epoch": 0.38, "learning_rate": 1.4152248314051695e-05, "loss": 1.3301, "step": 14017 }, { "epoch": 0.38, "learning_rate": 1.4151443644964971e-05, "loss": 1.2532, "step": 14018 }, { "epoch": 0.38, "learning_rate": 1.4150638943399302e-05, "loss": 1.272, "step": 14019 }, { "epoch": 0.38, "learning_rate": 1.4149834209360987e-05, "loss": 1.3645, "step": 14020 }, { "epoch": 0.38, "learning_rate": 1.4149029442856318e-05, "loss": 1.2346, "step": 14021 }, { "epoch": 0.38, "learning_rate": 1.4148224643891597e-05, "loss": 1.334, "step": 14022 }, { "epoch": 0.38, "learning_rate": 1.4147419812473115e-05, "loss": 1.3906, "step": 14023 }, { "epoch": 0.38, "learning_rate": 1.414661494860717e-05, "loss": 1.2888, "step": 14024 }, { "epoch": 0.38, "learning_rate": 1.4145810052300061e-05, "loss": 1.4167, "step": 14025 }, { "epoch": 0.38, "learning_rate": 1.4145005123558085e-05, "loss": 1.6777, "step": 14026 }, { "epoch": 0.38, "learning_rate": 1.4144200162387533e-05, "loss": 1.3457, "step": 14027 }, { "epoch": 0.38, "learning_rate": 1.4143395168794712e-05, "loss": 1.3992, "step": 14028 }, { "epoch": 0.38, "learning_rate": 1.4142590142785914e-05, "loss": 1.4316, "step": 14029 }, { "epoch": 0.38, "learning_rate": 1.4141785084367439e-05, "loss": 1.3833, "step": 14030 }, { "epoch": 0.38, "learning_rate": 1.4140979993545588e-05, "loss": 1.2742, "step": 14031 }, { "epoch": 0.38, "learning_rate": 1.4140174870326651e-05, "loss": 1.1709, "step": 14032 }, { "epoch": 0.38, "learning_rate": 1.4139369714716937e-05, "loss": 1.3306, "step": 14033 }, { "epoch": 0.38, "learning_rate": 1.413856452672274e-05, "loss": 1.1582, "step": 14034 }, { "epoch": 0.38, "learning_rate": 1.413775930635036e-05, "loss": 1.4463, "step": 14035 }, { "epoch": 0.38, "learning_rate": 1.4136954053606096e-05, "loss": 1.2061, "step": 14036 }, { "epoch": 0.38, "learning_rate": 1.413614876849625e-05, "loss": 1.4004, "step": 14037 }, { "epoch": 0.38, "learning_rate": 1.4135343451027119e-05, "loss": 1.2241, "step": 14038 }, { "epoch": 0.38, "learning_rate": 1.4134538101205008e-05, "loss": 1.3684, "step": 14039 }, { "epoch": 0.38, "learning_rate": 1.4133732719036212e-05, "loss": 1.1946, "step": 14040 }, { "epoch": 0.38, "learning_rate": 1.413292730452704e-05, "loss": 1.3743, "step": 14041 }, { "epoch": 0.38, "learning_rate": 1.4132121857683782e-05, "loss": 1.3792, "step": 14042 }, { "epoch": 0.38, "learning_rate": 1.413131637851275e-05, "loss": 1.6372, "step": 14043 }, { "epoch": 0.38, "learning_rate": 1.413051086702024e-05, "loss": 1.4375, "step": 14044 }, { "epoch": 0.38, "learning_rate": 1.4129705323212555e-05, "loss": 1.2385, "step": 14045 }, { "epoch": 0.38, "learning_rate": 1.4128899747095997e-05, "loss": 1.2446, "step": 14046 }, { "epoch": 0.38, "learning_rate": 1.412809413867687e-05, "loss": 1.1843, "step": 14047 }, { "epoch": 0.38, "learning_rate": 1.4127288497961476e-05, "loss": 1.2764, "step": 14048 }, { "epoch": 0.38, "learning_rate": 1.4126482824956118e-05, "loss": 1.4177, "step": 14049 }, { "epoch": 0.38, "learning_rate": 1.4125677119667098e-05, "loss": 1.3945, "step": 14050 }, { "epoch": 0.38, "learning_rate": 1.412487138210072e-05, "loss": 1.4707, "step": 14051 }, { "epoch": 0.38, "learning_rate": 1.4124065612263287e-05, "loss": 1.345, "step": 14052 }, { "epoch": 0.38, "learning_rate": 1.4123259810161107e-05, "loss": 1.2307, "step": 14053 }, { "epoch": 0.38, "learning_rate": 1.4122453975800477e-05, "loss": 1.2791, "step": 14054 }, { "epoch": 0.38, "learning_rate": 1.4121648109187709e-05, "loss": 1.4861, "step": 14055 }, { "epoch": 0.38, "learning_rate": 1.4120842210329103e-05, "loss": 1.3768, "step": 14056 }, { "epoch": 0.38, "learning_rate": 1.4120036279230966e-05, "loss": 1.3918, "step": 14057 }, { "epoch": 0.38, "learning_rate": 1.4119230315899602e-05, "loss": 1.2334, "step": 14058 }, { "epoch": 0.38, "learning_rate": 1.4118424320341316e-05, "loss": 1.251, "step": 14059 }, { "epoch": 0.38, "learning_rate": 1.4117618292562416e-05, "loss": 1.3604, "step": 14060 }, { "epoch": 0.38, "learning_rate": 1.4116812232569204e-05, "loss": 1.1682, "step": 14061 }, { "epoch": 0.38, "learning_rate": 1.4116006140367992e-05, "loss": 1.3113, "step": 14062 }, { "epoch": 0.38, "learning_rate": 1.4115200015965082e-05, "loss": 1.1021, "step": 14063 }, { "epoch": 0.38, "learning_rate": 1.4114393859366785e-05, "loss": 1.2363, "step": 14064 }, { "epoch": 0.38, "learning_rate": 1.4113587670579402e-05, "loss": 1.4456, "step": 14065 }, { "epoch": 0.38, "learning_rate": 1.4112781449609245e-05, "loss": 1.2312, "step": 14066 }, { "epoch": 0.38, "learning_rate": 1.4111975196462619e-05, "loss": 1.459, "step": 14067 }, { "epoch": 0.38, "learning_rate": 1.4111168911145834e-05, "loss": 1.2568, "step": 14068 }, { "epoch": 0.38, "learning_rate": 1.4110362593665197e-05, "loss": 1.3462, "step": 14069 }, { "epoch": 0.38, "learning_rate": 1.4109556244027013e-05, "loss": 1.2063, "step": 14070 }, { "epoch": 0.38, "learning_rate": 1.4108749862237594e-05, "loss": 1.1184, "step": 14071 }, { "epoch": 0.38, "learning_rate": 1.410794344830325e-05, "loss": 1.3823, "step": 14072 }, { "epoch": 0.38, "learning_rate": 1.4107137002230289e-05, "loss": 1.3169, "step": 14073 }, { "epoch": 0.38, "learning_rate": 1.4106330524025016e-05, "loss": 1.1624, "step": 14074 }, { "epoch": 0.38, "learning_rate": 1.4105524013693742e-05, "loss": 1.3618, "step": 14075 }, { "epoch": 0.38, "learning_rate": 1.4104717471242786e-05, "loss": 1.3511, "step": 14076 }, { "epoch": 0.38, "learning_rate": 1.4103910896678446e-05, "loss": 1.387, "step": 14077 }, { "epoch": 0.38, "learning_rate": 1.4103104290007039e-05, "loss": 1.478, "step": 14078 }, { "epoch": 0.38, "learning_rate": 1.410229765123487e-05, "loss": 1.4639, "step": 14079 }, { "epoch": 0.38, "learning_rate": 1.4101490980368257e-05, "loss": 1.2781, "step": 14080 }, { "epoch": 0.38, "learning_rate": 1.4100684277413505e-05, "loss": 1.3384, "step": 14081 }, { "epoch": 0.38, "learning_rate": 1.409987754237693e-05, "loss": 1.3552, "step": 14082 }, { "epoch": 0.38, "learning_rate": 1.4099070775264838e-05, "loss": 1.282, "step": 14083 }, { "epoch": 0.38, "learning_rate": 1.4098263976083545e-05, "loss": 1.2705, "step": 14084 }, { "epoch": 0.38, "learning_rate": 1.4097457144839362e-05, "loss": 1.3059, "step": 14085 }, { "epoch": 0.38, "learning_rate": 1.4096650281538602e-05, "loss": 1.2527, "step": 14086 }, { "epoch": 0.38, "learning_rate": 1.4095843386187575e-05, "loss": 1.2817, "step": 14087 }, { "epoch": 0.38, "learning_rate": 1.4095036458792597e-05, "loss": 1.2333, "step": 14088 }, { "epoch": 0.38, "learning_rate": 1.4094229499359976e-05, "loss": 1.3811, "step": 14089 }, { "epoch": 0.38, "learning_rate": 1.409342250789603e-05, "loss": 1.3748, "step": 14090 }, { "epoch": 0.38, "learning_rate": 1.409261548440707e-05, "loss": 1.3049, "step": 14091 }, { "epoch": 0.38, "learning_rate": 1.4091808428899417e-05, "loss": 1.2244, "step": 14092 }, { "epoch": 0.38, "learning_rate": 1.4091001341379374e-05, "loss": 1.3335, "step": 14093 }, { "epoch": 0.38, "learning_rate": 1.4090194221853262e-05, "loss": 1.3672, "step": 14094 }, { "epoch": 0.38, "learning_rate": 1.4089387070327391e-05, "loss": 1.3772, "step": 14095 }, { "epoch": 0.38, "learning_rate": 1.4088579886808083e-05, "loss": 1.4243, "step": 14096 }, { "epoch": 0.38, "learning_rate": 1.4087772671301643e-05, "loss": 1.4873, "step": 14097 }, { "epoch": 0.39, "learning_rate": 1.4086965423814396e-05, "loss": 1.3442, "step": 14098 }, { "epoch": 0.39, "learning_rate": 1.408615814435265e-05, "loss": 1.3284, "step": 14099 }, { "epoch": 0.39, "learning_rate": 1.4085350832922729e-05, "loss": 1.2195, "step": 14100 }, { "epoch": 0.39, "learning_rate": 1.408454348953094e-05, "loss": 1.2969, "step": 14101 }, { "epoch": 0.39, "learning_rate": 1.4083736114183606e-05, "loss": 1.334, "step": 14102 }, { "epoch": 0.39, "learning_rate": 1.4082928706887038e-05, "loss": 1.1635, "step": 14103 }, { "epoch": 0.39, "learning_rate": 1.4082121267647559e-05, "loss": 1.3169, "step": 14104 }, { "epoch": 0.39, "learning_rate": 1.4081313796471478e-05, "loss": 1.2729, "step": 14105 }, { "epoch": 0.39, "learning_rate": 1.4080506293365121e-05, "loss": 1.4397, "step": 14106 }, { "epoch": 0.39, "learning_rate": 1.40796987583348e-05, "loss": 1.3132, "step": 14107 }, { "epoch": 0.39, "learning_rate": 1.4078891191386839e-05, "loss": 1.2793, "step": 14108 }, { "epoch": 0.39, "learning_rate": 1.4078083592527545e-05, "loss": 1.7544, "step": 14109 }, { "epoch": 0.39, "learning_rate": 1.4077275961763246e-05, "loss": 1.2866, "step": 14110 }, { "epoch": 0.39, "learning_rate": 1.4076468299100255e-05, "loss": 1.2439, "step": 14111 }, { "epoch": 0.39, "learning_rate": 1.4075660604544896e-05, "loss": 1.4976, "step": 14112 }, { "epoch": 0.39, "learning_rate": 1.4074852878103483e-05, "loss": 1.3613, "step": 14113 }, { "epoch": 0.39, "learning_rate": 1.4074045119782338e-05, "loss": 1.3481, "step": 14114 }, { "epoch": 0.39, "learning_rate": 1.4073237329587776e-05, "loss": 1.3464, "step": 14115 }, { "epoch": 0.39, "learning_rate": 1.4072429507526127e-05, "loss": 1.5117, "step": 14116 }, { "epoch": 0.39, "learning_rate": 1.40716216536037e-05, "loss": 1.4082, "step": 14117 }, { "epoch": 0.39, "learning_rate": 1.4070813767826822e-05, "loss": 1.2966, "step": 14118 }, { "epoch": 0.39, "learning_rate": 1.4070005850201809e-05, "loss": 1.3713, "step": 14119 }, { "epoch": 0.39, "learning_rate": 1.4069197900734983e-05, "loss": 1.4341, "step": 14120 }, { "epoch": 0.39, "learning_rate": 1.406838991943267e-05, "loss": 1.3086, "step": 14121 }, { "epoch": 0.39, "learning_rate": 1.4067581906301185e-05, "loss": 1.4944, "step": 14122 }, { "epoch": 0.39, "learning_rate": 1.4066773861346854e-05, "loss": 1.3706, "step": 14123 }, { "epoch": 0.39, "learning_rate": 1.4065965784575995e-05, "loss": 1.3059, "step": 14124 }, { "epoch": 0.39, "learning_rate": 1.4065157675994931e-05, "loss": 1.3499, "step": 14125 }, { "epoch": 0.39, "learning_rate": 1.4064349535609987e-05, "loss": 1.1619, "step": 14126 }, { "epoch": 0.39, "learning_rate": 1.4063541363427483e-05, "loss": 1.1699, "step": 14127 }, { "epoch": 0.39, "learning_rate": 1.4062733159453741e-05, "loss": 1.4111, "step": 14128 }, { "epoch": 0.39, "learning_rate": 1.4061924923695084e-05, "loss": 1.4226, "step": 14129 }, { "epoch": 0.39, "learning_rate": 1.4061116656157839e-05, "loss": 1.4341, "step": 14130 }, { "epoch": 0.39, "learning_rate": 1.4060308356848326e-05, "loss": 1.2139, "step": 14131 }, { "epoch": 0.39, "learning_rate": 1.405950002577287e-05, "loss": 1.2712, "step": 14132 }, { "epoch": 0.39, "learning_rate": 1.4058691662937795e-05, "loss": 1.4834, "step": 14133 }, { "epoch": 0.39, "learning_rate": 1.4057883268349424e-05, "loss": 1.3154, "step": 14134 }, { "epoch": 0.39, "learning_rate": 1.4057074842014084e-05, "loss": 1.4653, "step": 14135 }, { "epoch": 0.39, "learning_rate": 1.4056266383938093e-05, "loss": 1.1809, "step": 14136 }, { "epoch": 0.39, "learning_rate": 1.4055457894127786e-05, "loss": 1.1917, "step": 14137 }, { "epoch": 0.39, "learning_rate": 1.4054649372589482e-05, "loss": 1.3145, "step": 14138 }, { "epoch": 0.39, "learning_rate": 1.405384081932951e-05, "loss": 1.2456, "step": 14139 }, { "epoch": 0.39, "learning_rate": 1.4053032234354191e-05, "loss": 1.3042, "step": 14140 }, { "epoch": 0.39, "learning_rate": 1.4052223617669856e-05, "loss": 1.3918, "step": 14141 }, { "epoch": 0.39, "learning_rate": 1.4051414969282828e-05, "loss": 1.2947, "step": 14142 }, { "epoch": 0.39, "learning_rate": 1.4050606289199436e-05, "loss": 1.498, "step": 14143 }, { "epoch": 0.39, "learning_rate": 1.4049797577426003e-05, "loss": 1.3633, "step": 14144 }, { "epoch": 0.39, "learning_rate": 1.4048988833968858e-05, "loss": 1.3157, "step": 14145 }, { "epoch": 0.39, "learning_rate": 1.4048180058834328e-05, "loss": 1.3491, "step": 14146 }, { "epoch": 0.39, "learning_rate": 1.4047371252028742e-05, "loss": 1.1807, "step": 14147 }, { "epoch": 0.39, "learning_rate": 1.4046562413558427e-05, "loss": 1.7422, "step": 14148 }, { "epoch": 0.39, "learning_rate": 1.404575354342971e-05, "loss": 1.4233, "step": 14149 }, { "epoch": 0.39, "learning_rate": 1.4044944641648918e-05, "loss": 1.2649, "step": 14150 }, { "epoch": 0.39, "learning_rate": 1.4044135708222381e-05, "loss": 1.2268, "step": 14151 }, { "epoch": 0.39, "learning_rate": 1.404332674315643e-05, "loss": 1.396, "step": 14152 }, { "epoch": 0.39, "learning_rate": 1.4042517746457391e-05, "loss": 1.8877, "step": 14153 }, { "epoch": 0.39, "learning_rate": 1.4041708718131595e-05, "loss": 1.2771, "step": 14154 }, { "epoch": 0.39, "learning_rate": 1.4040899658185371e-05, "loss": 1.2881, "step": 14155 }, { "epoch": 0.39, "learning_rate": 1.4040090566625047e-05, "loss": 1.7432, "step": 14156 }, { "epoch": 0.39, "learning_rate": 1.4039281443456957e-05, "loss": 1.1487, "step": 14157 }, { "epoch": 0.39, "learning_rate": 1.4038472288687422e-05, "loss": 1.4045, "step": 14158 }, { "epoch": 0.39, "learning_rate": 1.4037663102322784e-05, "loss": 1.3301, "step": 14159 }, { "epoch": 0.39, "learning_rate": 1.4036853884369366e-05, "loss": 1.1873, "step": 14160 }, { "epoch": 0.39, "learning_rate": 1.4036044634833506e-05, "loss": 1.3406, "step": 14161 }, { "epoch": 0.39, "learning_rate": 1.4035235353721524e-05, "loss": 1.3362, "step": 14162 }, { "epoch": 0.39, "learning_rate": 1.4034426041039763e-05, "loss": 1.3494, "step": 14163 }, { "epoch": 0.39, "learning_rate": 1.4033616696794547e-05, "loss": 1.2793, "step": 14164 }, { "epoch": 0.39, "learning_rate": 1.4032807320992215e-05, "loss": 1.5098, "step": 14165 }, { "epoch": 0.39, "learning_rate": 1.403199791363909e-05, "loss": 1.3176, "step": 14166 }, { "epoch": 0.39, "learning_rate": 1.403118847474151e-05, "loss": 1.3164, "step": 14167 }, { "epoch": 0.39, "learning_rate": 1.4030379004305807e-05, "loss": 1.8242, "step": 14168 }, { "epoch": 0.39, "learning_rate": 1.4029569502338316e-05, "loss": 1.2979, "step": 14169 }, { "epoch": 0.39, "learning_rate": 1.4028759968845367e-05, "loss": 1.2017, "step": 14170 }, { "epoch": 0.39, "learning_rate": 1.4027950403833295e-05, "loss": 1.2444, "step": 14171 }, { "epoch": 0.39, "learning_rate": 1.4027140807308433e-05, "loss": 1.1387, "step": 14172 }, { "epoch": 0.39, "learning_rate": 1.4026331179277113e-05, "loss": 1.4065, "step": 14173 }, { "epoch": 0.39, "learning_rate": 1.4025521519745673e-05, "loss": 1.2974, "step": 14174 }, { "epoch": 0.39, "learning_rate": 1.4024711828720445e-05, "loss": 1.1399, "step": 14175 }, { "epoch": 0.39, "learning_rate": 1.4023902106207766e-05, "loss": 1.1526, "step": 14176 }, { "epoch": 0.39, "learning_rate": 1.4023092352213968e-05, "loss": 1.4453, "step": 14177 }, { "epoch": 0.39, "learning_rate": 1.4022282566745387e-05, "loss": 1.3638, "step": 14178 }, { "epoch": 0.39, "learning_rate": 1.4021472749808359e-05, "loss": 1.2712, "step": 14179 }, { "epoch": 0.39, "learning_rate": 1.4020662901409217e-05, "loss": 1.3064, "step": 14180 }, { "epoch": 0.39, "learning_rate": 1.40198530215543e-05, "loss": 1.2542, "step": 14181 }, { "epoch": 0.39, "learning_rate": 1.4019043110249944e-05, "loss": 1.2766, "step": 14182 }, { "epoch": 0.39, "learning_rate": 1.4018233167502484e-05, "loss": 1.2803, "step": 14183 }, { "epoch": 0.39, "learning_rate": 1.4017423193318259e-05, "loss": 1.3303, "step": 14184 }, { "epoch": 0.39, "learning_rate": 1.4016613187703603e-05, "loss": 1.2588, "step": 14185 }, { "epoch": 0.39, "learning_rate": 1.4015803150664853e-05, "loss": 1.3662, "step": 14186 }, { "epoch": 0.39, "learning_rate": 1.4014993082208349e-05, "loss": 1.4121, "step": 14187 }, { "epoch": 0.39, "learning_rate": 1.4014182982340428e-05, "loss": 1.1582, "step": 14188 }, { "epoch": 0.39, "learning_rate": 1.4013372851067423e-05, "loss": 1.407, "step": 14189 }, { "epoch": 0.39, "learning_rate": 1.4012562688395682e-05, "loss": 1.1771, "step": 14190 }, { "epoch": 0.39, "learning_rate": 1.4011752494331532e-05, "loss": 1.2388, "step": 14191 }, { "epoch": 0.39, "learning_rate": 1.401094226888132e-05, "loss": 1.2979, "step": 14192 }, { "epoch": 0.39, "learning_rate": 1.4010132012051379e-05, "loss": 1.251, "step": 14193 }, { "epoch": 0.39, "learning_rate": 1.4009321723848054e-05, "loss": 1.3118, "step": 14194 }, { "epoch": 0.39, "learning_rate": 1.4008511404277679e-05, "loss": 1.3047, "step": 14195 }, { "epoch": 0.39, "learning_rate": 1.4007701053346597e-05, "loss": 1.4722, "step": 14196 }, { "epoch": 0.39, "learning_rate": 1.4006890671061143e-05, "loss": 1.3601, "step": 14197 }, { "epoch": 0.39, "learning_rate": 1.4006080257427663e-05, "loss": 1.3499, "step": 14198 }, { "epoch": 0.39, "learning_rate": 1.4005269812452495e-05, "loss": 1.3945, "step": 14199 }, { "epoch": 0.39, "learning_rate": 1.4004459336141982e-05, "loss": 1.3459, "step": 14200 }, { "epoch": 0.39, "learning_rate": 1.4003648828502459e-05, "loss": 1.3657, "step": 14201 }, { "epoch": 0.39, "learning_rate": 1.4002838289540273e-05, "loss": 1.4446, "step": 14202 }, { "epoch": 0.39, "learning_rate": 1.4002027719261757e-05, "loss": 1.3179, "step": 14203 }, { "epoch": 0.39, "learning_rate": 1.4001217117673265e-05, "loss": 1.4058, "step": 14204 }, { "epoch": 0.39, "learning_rate": 1.4000406484781125e-05, "loss": 1.3625, "step": 14205 }, { "epoch": 0.39, "learning_rate": 1.3999595820591691e-05, "loss": 1.2004, "step": 14206 }, { "epoch": 0.39, "learning_rate": 1.3998785125111297e-05, "loss": 1.342, "step": 14207 }, { "epoch": 0.39, "learning_rate": 1.3997974398346293e-05, "loss": 1.3821, "step": 14208 }, { "epoch": 0.39, "learning_rate": 1.3997163640303012e-05, "loss": 1.2849, "step": 14209 }, { "epoch": 0.39, "learning_rate": 1.3996352850987806e-05, "loss": 1.7959, "step": 14210 }, { "epoch": 0.39, "learning_rate": 1.399554203040701e-05, "loss": 1.3962, "step": 14211 }, { "epoch": 0.39, "learning_rate": 1.3994731178566978e-05, "loss": 1.4258, "step": 14212 }, { "epoch": 0.39, "learning_rate": 1.3993920295474043e-05, "loss": 1.3557, "step": 14213 }, { "epoch": 0.39, "learning_rate": 1.3993109381134553e-05, "loss": 1.3506, "step": 14214 }, { "epoch": 0.39, "learning_rate": 1.3992298435554856e-05, "loss": 1.2856, "step": 14215 }, { "epoch": 0.39, "learning_rate": 1.3991487458741293e-05, "loss": 1.3628, "step": 14216 }, { "epoch": 0.39, "learning_rate": 1.399067645070021e-05, "loss": 1.2458, "step": 14217 }, { "epoch": 0.39, "learning_rate": 1.3989865411437949e-05, "loss": 1.2065, "step": 14218 }, { "epoch": 0.39, "learning_rate": 1.3989054340960857e-05, "loss": 1.2351, "step": 14219 }, { "epoch": 0.39, "learning_rate": 1.3988243239275281e-05, "loss": 1.3096, "step": 14220 }, { "epoch": 0.39, "learning_rate": 1.3987432106387564e-05, "loss": 1.2959, "step": 14221 }, { "epoch": 0.39, "learning_rate": 1.3986620942304054e-05, "loss": 1.2827, "step": 14222 }, { "epoch": 0.39, "learning_rate": 1.3985809747031094e-05, "loss": 1.4153, "step": 14223 }, { "epoch": 0.39, "learning_rate": 1.3984998520575037e-05, "loss": 1.4001, "step": 14224 }, { "epoch": 0.39, "learning_rate": 1.3984187262942222e-05, "loss": 1.2305, "step": 14225 }, { "epoch": 0.39, "learning_rate": 1.3983375974139003e-05, "loss": 1.4312, "step": 14226 }, { "epoch": 0.39, "learning_rate": 1.398256465417172e-05, "loss": 1.3843, "step": 14227 }, { "epoch": 0.39, "learning_rate": 1.3981753303046725e-05, "loss": 1.3413, "step": 14228 }, { "epoch": 0.39, "learning_rate": 1.3980941920770366e-05, "loss": 1.2349, "step": 14229 }, { "epoch": 0.39, "learning_rate": 1.3980130507348985e-05, "loss": 1.3257, "step": 14230 }, { "epoch": 0.39, "learning_rate": 1.397931906278894e-05, "loss": 1.3396, "step": 14231 }, { "epoch": 0.39, "learning_rate": 1.397850758709657e-05, "loss": 1.4468, "step": 14232 }, { "epoch": 0.39, "learning_rate": 1.3977696080278231e-05, "loss": 1.3245, "step": 14233 }, { "epoch": 0.39, "learning_rate": 1.3976884542340266e-05, "loss": 1.3328, "step": 14234 }, { "epoch": 0.39, "learning_rate": 1.3976072973289027e-05, "loss": 1.2932, "step": 14235 }, { "epoch": 0.39, "learning_rate": 1.3975261373130861e-05, "loss": 1.4187, "step": 14236 }, { "epoch": 0.39, "learning_rate": 1.3974449741872123e-05, "loss": 1.2927, "step": 14237 }, { "epoch": 0.39, "learning_rate": 1.3973638079519153e-05, "loss": 1.4382, "step": 14238 }, { "epoch": 0.39, "learning_rate": 1.3972826386078313e-05, "loss": 1.2676, "step": 14239 }, { "epoch": 0.39, "learning_rate": 1.3972014661555947e-05, "loss": 1.4216, "step": 14240 }, { "epoch": 0.39, "learning_rate": 1.3971202905958405e-05, "loss": 1.2273, "step": 14241 }, { "epoch": 0.39, "learning_rate": 1.3970391119292037e-05, "loss": 1.3174, "step": 14242 }, { "epoch": 0.39, "learning_rate": 1.39695793015632e-05, "loss": 1.2759, "step": 14243 }, { "epoch": 0.39, "learning_rate": 1.3968767452778234e-05, "loss": 1.3057, "step": 14244 }, { "epoch": 0.39, "learning_rate": 1.3967955572943503e-05, "loss": 1.303, "step": 14245 }, { "epoch": 0.39, "learning_rate": 1.3967143662065353e-05, "loss": 1.3445, "step": 14246 }, { "epoch": 0.39, "learning_rate": 1.3966331720150134e-05, "loss": 1.4636, "step": 14247 }, { "epoch": 0.39, "learning_rate": 1.3965519747204205e-05, "loss": 1.3201, "step": 14248 }, { "epoch": 0.39, "learning_rate": 1.3964707743233913e-05, "loss": 1.2776, "step": 14249 }, { "epoch": 0.39, "learning_rate": 1.396389570824561e-05, "loss": 1.4341, "step": 14250 }, { "epoch": 0.39, "learning_rate": 1.3963083642245651e-05, "loss": 1.3594, "step": 14251 }, { "epoch": 0.39, "learning_rate": 1.3962271545240391e-05, "loss": 1.2366, "step": 14252 }, { "epoch": 0.39, "learning_rate": 1.3961459417236181e-05, "loss": 1.2615, "step": 14253 }, { "epoch": 0.39, "learning_rate": 1.3960647258239375e-05, "loss": 1.3206, "step": 14254 }, { "epoch": 0.39, "learning_rate": 1.395983506825633e-05, "loss": 1.437, "step": 14255 }, { "epoch": 0.39, "learning_rate": 1.3959022847293393e-05, "loss": 1.4697, "step": 14256 }, { "epoch": 0.39, "learning_rate": 1.3958210595356924e-05, "loss": 1.3635, "step": 14257 }, { "epoch": 0.39, "learning_rate": 1.3957398312453277e-05, "loss": 1.2368, "step": 14258 }, { "epoch": 0.39, "learning_rate": 1.3956585998588807e-05, "loss": 1.3862, "step": 14259 }, { "epoch": 0.39, "learning_rate": 1.3955773653769867e-05, "loss": 1.2961, "step": 14260 }, { "epoch": 0.39, "learning_rate": 1.3954961278002816e-05, "loss": 1.1333, "step": 14261 }, { "epoch": 0.39, "learning_rate": 1.3954148871294006e-05, "loss": 1.3394, "step": 14262 }, { "epoch": 0.39, "learning_rate": 1.3953336433649797e-05, "loss": 1.4395, "step": 14263 }, { "epoch": 0.39, "learning_rate": 1.3952523965076542e-05, "loss": 1.2954, "step": 14264 }, { "epoch": 0.39, "learning_rate": 1.3951711465580598e-05, "loss": 1.395, "step": 14265 }, { "epoch": 0.39, "learning_rate": 1.395089893516832e-05, "loss": 1.3623, "step": 14266 }, { "epoch": 0.39, "learning_rate": 1.395008637384607e-05, "loss": 1.2883, "step": 14267 }, { "epoch": 0.39, "learning_rate": 1.3949273781620198e-05, "loss": 1.2673, "step": 14268 }, { "epoch": 0.39, "learning_rate": 1.3948461158497068e-05, "loss": 1.1949, "step": 14269 }, { "epoch": 0.39, "learning_rate": 1.3947648504483033e-05, "loss": 1.7192, "step": 14270 }, { "epoch": 0.39, "learning_rate": 1.3946835819584452e-05, "loss": 1.2886, "step": 14271 }, { "epoch": 0.39, "learning_rate": 1.3946023103807684e-05, "loss": 1.3149, "step": 14272 }, { "epoch": 0.39, "learning_rate": 1.394521035715909e-05, "loss": 1.3784, "step": 14273 }, { "epoch": 0.39, "learning_rate": 1.3944397579645019e-05, "loss": 1.3076, "step": 14274 }, { "epoch": 0.39, "learning_rate": 1.3943584771271838e-05, "loss": 1.21, "step": 14275 }, { "epoch": 0.39, "learning_rate": 1.394277193204591e-05, "loss": 1.4343, "step": 14276 }, { "epoch": 0.39, "learning_rate": 1.394195906197358e-05, "loss": 1.4377, "step": 14277 }, { "epoch": 0.39, "learning_rate": 1.3941146161061223e-05, "loss": 1.4888, "step": 14278 }, { "epoch": 0.39, "learning_rate": 1.3940333229315186e-05, "loss": 1.1895, "step": 14279 }, { "epoch": 0.39, "learning_rate": 1.393952026674184e-05, "loss": 1.2939, "step": 14280 }, { "epoch": 0.39, "learning_rate": 1.3938707273347536e-05, "loss": 1.4839, "step": 14281 }, { "epoch": 0.39, "learning_rate": 1.3937894249138642e-05, "loss": 1.3103, "step": 14282 }, { "epoch": 0.39, "learning_rate": 1.393708119412151e-05, "loss": 1.4434, "step": 14283 }, { "epoch": 0.39, "learning_rate": 1.3936268108302508e-05, "loss": 1.4055, "step": 14284 }, { "epoch": 0.39, "learning_rate": 1.3935454991687997e-05, "loss": 1.3191, "step": 14285 }, { "epoch": 0.39, "learning_rate": 1.3934641844284338e-05, "loss": 1.3875, "step": 14286 }, { "epoch": 0.39, "learning_rate": 1.3933828666097889e-05, "loss": 1.1663, "step": 14287 }, { "epoch": 0.39, "learning_rate": 1.3933015457135013e-05, "loss": 1.3728, "step": 14288 }, { "epoch": 0.39, "learning_rate": 1.3932202217402076e-05, "loss": 1.376, "step": 14289 }, { "epoch": 0.39, "learning_rate": 1.3931388946905437e-05, "loss": 1.3389, "step": 14290 }, { "epoch": 0.39, "learning_rate": 1.3930575645651457e-05, "loss": 1.7256, "step": 14291 }, { "epoch": 0.39, "learning_rate": 1.3929762313646505e-05, "loss": 1.2493, "step": 14292 }, { "epoch": 0.39, "learning_rate": 1.3928948950896938e-05, "loss": 1.1663, "step": 14293 }, { "epoch": 0.39, "learning_rate": 1.3928135557409125e-05, "loss": 1.3406, "step": 14294 }, { "epoch": 0.39, "learning_rate": 1.3927322133189426e-05, "loss": 1.3813, "step": 14295 }, { "epoch": 0.39, "learning_rate": 1.3926508678244204e-05, "loss": 1.3494, "step": 14296 }, { "epoch": 0.39, "learning_rate": 1.3925695192579824e-05, "loss": 1.2349, "step": 14297 }, { "epoch": 0.39, "learning_rate": 1.3924881676202652e-05, "loss": 1.2761, "step": 14298 }, { "epoch": 0.39, "learning_rate": 1.392406812911905e-05, "loss": 1.8013, "step": 14299 }, { "epoch": 0.39, "learning_rate": 1.3923254551335385e-05, "loss": 1.314, "step": 14300 }, { "epoch": 0.39, "learning_rate": 1.3922440942858022e-05, "loss": 1.479, "step": 14301 }, { "epoch": 0.39, "learning_rate": 1.3921627303693326e-05, "loss": 1.3547, "step": 14302 }, { "epoch": 0.39, "learning_rate": 1.3920813633847661e-05, "loss": 1.4409, "step": 14303 }, { "epoch": 0.39, "learning_rate": 1.3919999933327395e-05, "loss": 1.249, "step": 14304 }, { "epoch": 0.39, "learning_rate": 1.391918620213889e-05, "loss": 1.3364, "step": 14305 }, { "epoch": 0.39, "learning_rate": 1.3918372440288516e-05, "loss": 1.4331, "step": 14306 }, { "epoch": 0.39, "learning_rate": 1.3917558647782638e-05, "loss": 1.0703, "step": 14307 }, { "epoch": 0.39, "learning_rate": 1.3916744824627625e-05, "loss": 1.3315, "step": 14308 }, { "epoch": 0.39, "learning_rate": 1.3915930970829844e-05, "loss": 1.4331, "step": 14309 }, { "epoch": 0.39, "learning_rate": 1.3915117086395658e-05, "loss": 1.3235, "step": 14310 }, { "epoch": 0.39, "learning_rate": 1.3914303171331436e-05, "loss": 1.3735, "step": 14311 }, { "epoch": 0.39, "learning_rate": 1.3913489225643551e-05, "loss": 1.3682, "step": 14312 }, { "epoch": 0.39, "learning_rate": 1.3912675249338361e-05, "loss": 1.3904, "step": 14313 }, { "epoch": 0.39, "learning_rate": 1.3911861242422244e-05, "loss": 1.3945, "step": 14314 }, { "epoch": 0.39, "learning_rate": 1.391104720490156e-05, "loss": 1.3611, "step": 14315 }, { "epoch": 0.39, "learning_rate": 1.3910233136782687e-05, "loss": 1.4785, "step": 14316 }, { "epoch": 0.39, "learning_rate": 1.3909419038071983e-05, "loss": 1.2942, "step": 14317 }, { "epoch": 0.39, "learning_rate": 1.3908604908775827e-05, "loss": 1.2429, "step": 14318 }, { "epoch": 0.39, "learning_rate": 1.3907790748900582e-05, "loss": 1.3857, "step": 14319 }, { "epoch": 0.39, "learning_rate": 1.3906976558452622e-05, "loss": 1.3657, "step": 14320 }, { "epoch": 0.39, "learning_rate": 1.390616233743831e-05, "loss": 1.3879, "step": 14321 }, { "epoch": 0.39, "learning_rate": 1.3905348085864025e-05, "loss": 1.29, "step": 14322 }, { "epoch": 0.39, "learning_rate": 1.3904533803736134e-05, "loss": 1.2083, "step": 14323 }, { "epoch": 0.39, "learning_rate": 1.3903719491061003e-05, "loss": 1.3333, "step": 14324 }, { "epoch": 0.39, "learning_rate": 1.3902905147845007e-05, "loss": 1.2424, "step": 14325 }, { "epoch": 0.39, "learning_rate": 1.390209077409452e-05, "loss": 1.2903, "step": 14326 }, { "epoch": 0.39, "learning_rate": 1.3901276369815906e-05, "loss": 1.2036, "step": 14327 }, { "epoch": 0.39, "learning_rate": 1.3900461935015539e-05, "loss": 1.158, "step": 14328 }, { "epoch": 0.39, "learning_rate": 1.3899647469699795e-05, "loss": 1.4531, "step": 14329 }, { "epoch": 0.39, "learning_rate": 1.3898832973875043e-05, "loss": 1.3147, "step": 14330 }, { "epoch": 0.39, "learning_rate": 1.3898018447547655e-05, "loss": 1.1223, "step": 14331 }, { "epoch": 0.39, "learning_rate": 1.3897203890724e-05, "loss": 1.3237, "step": 14332 }, { "epoch": 0.39, "learning_rate": 1.3896389303410457e-05, "loss": 1.2026, "step": 14333 }, { "epoch": 0.39, "learning_rate": 1.3895574685613396e-05, "loss": 1.3086, "step": 14334 }, { "epoch": 0.39, "learning_rate": 1.3894760037339193e-05, "loss": 1.3367, "step": 14335 }, { "epoch": 0.39, "learning_rate": 1.3893945358594216e-05, "loss": 1.3, "step": 14336 }, { "epoch": 0.39, "learning_rate": 1.389313064938484e-05, "loss": 1.2805, "step": 14337 }, { "epoch": 0.39, "learning_rate": 1.3892315909717443e-05, "loss": 1.1992, "step": 14338 }, { "epoch": 0.39, "learning_rate": 1.3891501139598397e-05, "loss": 1.3, "step": 14339 }, { "epoch": 0.39, "learning_rate": 1.3890686339034074e-05, "loss": 1.3926, "step": 14340 }, { "epoch": 0.39, "learning_rate": 1.3889871508030854e-05, "loss": 1.1816, "step": 14341 }, { "epoch": 0.39, "learning_rate": 1.3889056646595104e-05, "loss": 1.3711, "step": 14342 }, { "epoch": 0.39, "learning_rate": 1.388824175473321e-05, "loss": 1.2036, "step": 14343 }, { "epoch": 0.39, "learning_rate": 1.3887426832451534e-05, "loss": 1.3708, "step": 14344 }, { "epoch": 0.39, "learning_rate": 1.3886611879756461e-05, "loss": 1.3589, "step": 14345 }, { "epoch": 0.39, "learning_rate": 1.3885796896654364e-05, "loss": 1.186, "step": 14346 }, { "epoch": 0.39, "learning_rate": 1.3884981883151623e-05, "loss": 1.3701, "step": 14347 }, { "epoch": 0.39, "learning_rate": 1.3884166839254607e-05, "loss": 1.4375, "step": 14348 }, { "epoch": 0.39, "learning_rate": 1.3883351764969698e-05, "loss": 1.3733, "step": 14349 }, { "epoch": 0.39, "learning_rate": 1.3882536660303267e-05, "loss": 1.3687, "step": 14350 }, { "epoch": 0.39, "learning_rate": 1.38817215252617e-05, "loss": 1.2676, "step": 14351 }, { "epoch": 0.39, "learning_rate": 1.3880906359851364e-05, "loss": 1.7378, "step": 14352 }, { "epoch": 0.39, "learning_rate": 1.3880091164078644e-05, "loss": 1.2744, "step": 14353 }, { "epoch": 0.39, "learning_rate": 1.3879275937949914e-05, "loss": 1.2854, "step": 14354 }, { "epoch": 0.39, "learning_rate": 1.3878460681471557e-05, "loss": 1.3396, "step": 14355 }, { "epoch": 0.39, "learning_rate": 1.3877645394649944e-05, "loss": 1.4639, "step": 14356 }, { "epoch": 0.39, "learning_rate": 1.3876830077491459e-05, "loss": 1.3232, "step": 14357 }, { "epoch": 0.39, "learning_rate": 1.3876014730002476e-05, "loss": 1.2017, "step": 14358 }, { "epoch": 0.39, "learning_rate": 1.3875199352189377e-05, "loss": 1.3845, "step": 14359 }, { "epoch": 0.39, "learning_rate": 1.3874383944058543e-05, "loss": 1.4146, "step": 14360 }, { "epoch": 0.39, "learning_rate": 1.3873568505616348e-05, "loss": 1.2915, "step": 14361 }, { "epoch": 0.39, "learning_rate": 1.3872753036869176e-05, "loss": 1.4084, "step": 14362 }, { "epoch": 0.39, "learning_rate": 1.3871937537823405e-05, "loss": 1.2258, "step": 14363 }, { "epoch": 0.39, "learning_rate": 1.3871122008485415e-05, "loss": 1.2786, "step": 14364 }, { "epoch": 0.39, "learning_rate": 1.3870306448861588e-05, "loss": 1.2288, "step": 14365 }, { "epoch": 0.39, "learning_rate": 1.3869490858958301e-05, "loss": 1.3755, "step": 14366 }, { "epoch": 0.39, "learning_rate": 1.3868675238781939e-05, "loss": 1.2336, "step": 14367 }, { "epoch": 0.39, "learning_rate": 1.3867859588338881e-05, "loss": 1.2104, "step": 14368 }, { "epoch": 0.39, "learning_rate": 1.3867043907635507e-05, "loss": 1.0904, "step": 14369 }, { "epoch": 0.39, "learning_rate": 1.38662281966782e-05, "loss": 1.2683, "step": 14370 }, { "epoch": 0.39, "learning_rate": 1.3865412455473343e-05, "loss": 1.4248, "step": 14371 }, { "epoch": 0.39, "learning_rate": 1.3864596684027313e-05, "loss": 1.3777, "step": 14372 }, { "epoch": 0.39, "learning_rate": 1.3863780882346503e-05, "loss": 1.3762, "step": 14373 }, { "epoch": 0.39, "learning_rate": 1.3862965050437282e-05, "loss": 1.3672, "step": 14374 }, { "epoch": 0.39, "learning_rate": 1.3862149188306042e-05, "loss": 1.2549, "step": 14375 }, { "epoch": 0.39, "learning_rate": 1.386133329595916e-05, "loss": 1.3459, "step": 14376 }, { "epoch": 0.39, "learning_rate": 1.3860517373403027e-05, "loss": 1.2581, "step": 14377 }, { "epoch": 0.39, "learning_rate": 1.3859701420644015e-05, "loss": 1.1404, "step": 14378 }, { "epoch": 0.39, "learning_rate": 1.385888543768852e-05, "loss": 1.2795, "step": 14379 }, { "epoch": 0.39, "learning_rate": 1.3858069424542917e-05, "loss": 1.3577, "step": 14380 }, { "epoch": 0.39, "learning_rate": 1.3857253381213593e-05, "loss": 1.2744, "step": 14381 }, { "epoch": 0.39, "learning_rate": 1.3856437307706934e-05, "loss": 1.2405, "step": 14382 }, { "epoch": 0.39, "learning_rate": 1.3855621204029321e-05, "loss": 1.3408, "step": 14383 }, { "epoch": 0.39, "learning_rate": 1.385480507018714e-05, "loss": 1.363, "step": 14384 }, { "epoch": 0.39, "learning_rate": 1.3853988906186778e-05, "loss": 1.3547, "step": 14385 }, { "epoch": 0.39, "learning_rate": 1.385317271203462e-05, "loss": 1.1741, "step": 14386 }, { "epoch": 0.39, "learning_rate": 1.3852356487737049e-05, "loss": 1.3694, "step": 14387 }, { "epoch": 0.39, "learning_rate": 1.3851540233300454e-05, "loss": 1.3782, "step": 14388 }, { "epoch": 0.39, "learning_rate": 1.3850723948731217e-05, "loss": 1.3477, "step": 14389 }, { "epoch": 0.39, "learning_rate": 1.3849907634035728e-05, "loss": 1.2852, "step": 14390 }, { "epoch": 0.39, "learning_rate": 1.3849091289220374e-05, "loss": 1.2368, "step": 14391 }, { "epoch": 0.39, "learning_rate": 1.3848274914291537e-05, "loss": 1.1521, "step": 14392 }, { "epoch": 0.39, "learning_rate": 1.3847458509255608e-05, "loss": 1.5278, "step": 14393 }, { "epoch": 0.39, "learning_rate": 1.3846642074118973e-05, "loss": 1.4688, "step": 14394 }, { "epoch": 0.39, "learning_rate": 1.3845825608888017e-05, "loss": 1.3376, "step": 14395 }, { "epoch": 0.39, "learning_rate": 1.3845009113569132e-05, "loss": 1.312, "step": 14396 }, { "epoch": 0.39, "learning_rate": 1.3844192588168701e-05, "loss": 1.3267, "step": 14397 }, { "epoch": 0.39, "learning_rate": 1.3843376032693118e-05, "loss": 1.3062, "step": 14398 }, { "epoch": 0.39, "learning_rate": 1.3842559447148764e-05, "loss": 1.3154, "step": 14399 }, { "epoch": 0.39, "learning_rate": 1.3841742831542038e-05, "loss": 1.4014, "step": 14400 }, { "epoch": 0.39, "learning_rate": 1.3840926185879318e-05, "loss": 1.5117, "step": 14401 }, { "epoch": 0.39, "learning_rate": 1.3840109510167002e-05, "loss": 1.0806, "step": 14402 }, { "epoch": 0.39, "learning_rate": 1.383929280441147e-05, "loss": 1.3804, "step": 14403 }, { "epoch": 0.39, "learning_rate": 1.3838476068619117e-05, "loss": 1.2986, "step": 14404 }, { "epoch": 0.39, "learning_rate": 1.3837659302796334e-05, "loss": 1.2534, "step": 14405 }, { "epoch": 0.39, "learning_rate": 1.3836842506949511e-05, "loss": 1.2622, "step": 14406 }, { "epoch": 0.39, "learning_rate": 1.3836025681085032e-05, "loss": 1.2847, "step": 14407 }, { "epoch": 0.39, "learning_rate": 1.3835208825209297e-05, "loss": 1.7954, "step": 14408 }, { "epoch": 0.39, "learning_rate": 1.383439193932869e-05, "loss": 1.1124, "step": 14409 }, { "epoch": 0.39, "learning_rate": 1.3833575023449601e-05, "loss": 1.2424, "step": 14410 }, { "epoch": 0.39, "learning_rate": 1.3832758077578425e-05, "loss": 1.4766, "step": 14411 }, { "epoch": 0.39, "learning_rate": 1.3831941101721553e-05, "loss": 1.7051, "step": 14412 }, { "epoch": 0.39, "learning_rate": 1.3831124095885372e-05, "loss": 1.3098, "step": 14413 }, { "epoch": 0.39, "learning_rate": 1.3830307060076282e-05, "loss": 1.0757, "step": 14414 }, { "epoch": 0.39, "learning_rate": 1.3829489994300667e-05, "loss": 1.2432, "step": 14415 }, { "epoch": 0.39, "learning_rate": 1.3828672898564928e-05, "loss": 1.2234, "step": 14416 }, { "epoch": 0.39, "learning_rate": 1.3827855772875447e-05, "loss": 1.6475, "step": 14417 }, { "epoch": 0.39, "learning_rate": 1.3827038617238628e-05, "loss": 1.342, "step": 14418 }, { "epoch": 0.39, "learning_rate": 1.3826221431660854e-05, "loss": 1.2334, "step": 14419 }, { "epoch": 0.39, "learning_rate": 1.3825404216148526e-05, "loss": 1.2988, "step": 14420 }, { "epoch": 0.39, "learning_rate": 1.3824586970708031e-05, "loss": 1.2434, "step": 14421 }, { "epoch": 0.39, "learning_rate": 1.382376969534577e-05, "loss": 1.447, "step": 14422 }, { "epoch": 0.39, "learning_rate": 1.382295239006813e-05, "loss": 1.3638, "step": 14423 }, { "epoch": 0.39, "learning_rate": 1.382213505488151e-05, "loss": 1.286, "step": 14424 }, { "epoch": 0.39, "learning_rate": 1.38213176897923e-05, "loss": 1.4575, "step": 14425 }, { "epoch": 0.39, "learning_rate": 1.38205002948069e-05, "loss": 1.2043, "step": 14426 }, { "epoch": 0.39, "learning_rate": 1.3819682869931699e-05, "loss": 1.4775, "step": 14427 }, { "epoch": 0.39, "learning_rate": 1.38188654151731e-05, "loss": 1.2595, "step": 14428 }, { "epoch": 0.39, "learning_rate": 1.3818047930537491e-05, "loss": 1.3325, "step": 14429 }, { "epoch": 0.39, "learning_rate": 1.3817230416031268e-05, "loss": 1.2776, "step": 14430 }, { "epoch": 0.39, "learning_rate": 1.3816412871660833e-05, "loss": 1.2659, "step": 14431 }, { "epoch": 0.39, "learning_rate": 1.3815595297432575e-05, "loss": 1.3843, "step": 14432 }, { "epoch": 0.39, "learning_rate": 1.3814777693352899e-05, "loss": 1.2859, "step": 14433 }, { "epoch": 0.39, "learning_rate": 1.3813960059428192e-05, "loss": 1.4761, "step": 14434 }, { "epoch": 0.39, "learning_rate": 1.3813142395664856e-05, "loss": 1.4658, "step": 14435 }, { "epoch": 0.39, "learning_rate": 1.3812324702069285e-05, "loss": 1.1775, "step": 14436 }, { "epoch": 0.39, "learning_rate": 1.3811506978647882e-05, "loss": 1.2078, "step": 14437 }, { "epoch": 0.39, "learning_rate": 1.3810689225407037e-05, "loss": 1.5054, "step": 14438 }, { "epoch": 0.39, "learning_rate": 1.3809871442353155e-05, "loss": 1.3525, "step": 14439 }, { "epoch": 0.39, "learning_rate": 1.3809053629492626e-05, "loss": 1.3745, "step": 14440 }, { "epoch": 0.39, "learning_rate": 1.3808235786831856e-05, "loss": 1.3379, "step": 14441 }, { "epoch": 0.39, "learning_rate": 1.380741791437724e-05, "loss": 1.3481, "step": 14442 }, { "epoch": 0.39, "learning_rate": 1.3806600012135176e-05, "loss": 1.4248, "step": 14443 }, { "epoch": 0.39, "learning_rate": 1.380578208011206e-05, "loss": 1.3896, "step": 14444 }, { "epoch": 0.39, "learning_rate": 1.38049641183143e-05, "loss": 1.2173, "step": 14445 }, { "epoch": 0.39, "learning_rate": 1.3804146126748284e-05, "loss": 1.251, "step": 14446 }, { "epoch": 0.39, "learning_rate": 1.3803328105420422e-05, "loss": 1.3306, "step": 14447 }, { "epoch": 0.39, "learning_rate": 1.3802510054337109e-05, "loss": 1.3516, "step": 14448 }, { "epoch": 0.39, "learning_rate": 1.3801691973504745e-05, "loss": 1.4639, "step": 14449 }, { "epoch": 0.39, "learning_rate": 1.380087386292973e-05, "loss": 1.2874, "step": 14450 }, { "epoch": 0.39, "learning_rate": 1.3800055722618467e-05, "loss": 1.2361, "step": 14451 }, { "epoch": 0.39, "learning_rate": 1.3799237552577354e-05, "loss": 1.1697, "step": 14452 }, { "epoch": 0.39, "learning_rate": 1.3798419352812792e-05, "loss": 1.7803, "step": 14453 }, { "epoch": 0.39, "learning_rate": 1.3797601123331183e-05, "loss": 1.3921, "step": 14454 }, { "epoch": 0.39, "learning_rate": 1.3796782864138929e-05, "loss": 1.2439, "step": 14455 }, { "epoch": 0.39, "learning_rate": 1.3795964575242432e-05, "loss": 1.2971, "step": 14456 }, { "epoch": 0.39, "learning_rate": 1.3795146256648093e-05, "loss": 1.3906, "step": 14457 }, { "epoch": 0.39, "learning_rate": 1.3794327908362313e-05, "loss": 1.2859, "step": 14458 }, { "epoch": 0.39, "learning_rate": 1.3793509530391498e-05, "loss": 1.2751, "step": 14459 }, { "epoch": 0.39, "learning_rate": 1.3792691122742046e-05, "loss": 1.4055, "step": 14460 }, { "epoch": 0.39, "learning_rate": 1.3791872685420363e-05, "loss": 1.2334, "step": 14461 }, { "epoch": 0.39, "learning_rate": 1.379105421843285e-05, "loss": 1.3965, "step": 14462 }, { "epoch": 0.39, "learning_rate": 1.3790235721785914e-05, "loss": 1.5134, "step": 14463 }, { "epoch": 0.4, "learning_rate": 1.3789417195485952e-05, "loss": 1.3843, "step": 14464 }, { "epoch": 0.4, "learning_rate": 1.3788598639539377e-05, "loss": 1.3335, "step": 14465 }, { "epoch": 0.4, "learning_rate": 1.3787780053952584e-05, "loss": 1.3643, "step": 14466 }, { "epoch": 0.4, "learning_rate": 1.3786961438731983e-05, "loss": 1.2144, "step": 14467 }, { "epoch": 0.4, "learning_rate": 1.3786142793883974e-05, "loss": 1.363, "step": 14468 }, { "epoch": 0.4, "learning_rate": 1.3785324119414968e-05, "loss": 1.2656, "step": 14469 }, { "epoch": 0.4, "learning_rate": 1.3784505415331362e-05, "loss": 1.3735, "step": 14470 }, { "epoch": 0.4, "learning_rate": 1.378368668163957e-05, "loss": 1.2156, "step": 14471 }, { "epoch": 0.4, "learning_rate": 1.3782867918345987e-05, "loss": 1.3147, "step": 14472 }, { "epoch": 0.4, "learning_rate": 1.3782049125457028e-05, "loss": 1.2783, "step": 14473 }, { "epoch": 0.4, "learning_rate": 1.3781230302979094e-05, "loss": 1.2305, "step": 14474 }, { "epoch": 0.4, "learning_rate": 1.3780411450918594e-05, "loss": 1.2, "step": 14475 }, { "epoch": 0.4, "learning_rate": 1.377959256928193e-05, "loss": 1.396, "step": 14476 }, { "epoch": 0.4, "learning_rate": 1.377877365807551e-05, "loss": 1.0574, "step": 14477 }, { "epoch": 0.4, "learning_rate": 1.3777954717305743e-05, "loss": 1.2585, "step": 14478 }, { "epoch": 0.4, "learning_rate": 1.3777135746979035e-05, "loss": 1.4143, "step": 14479 }, { "epoch": 0.4, "learning_rate": 1.3776316747101795e-05, "loss": 1.2524, "step": 14480 }, { "epoch": 0.4, "learning_rate": 1.3775497717680426e-05, "loss": 1.4946, "step": 14481 }, { "epoch": 0.4, "learning_rate": 1.3774678658721342e-05, "loss": 1.4185, "step": 14482 }, { "epoch": 0.4, "learning_rate": 1.377385957023094e-05, "loss": 1.3433, "step": 14483 }, { "epoch": 0.4, "learning_rate": 1.3773040452215642e-05, "loss": 1.4187, "step": 14484 }, { "epoch": 0.4, "learning_rate": 1.3772221304681848e-05, "loss": 1.2292, "step": 14485 }, { "epoch": 0.4, "learning_rate": 1.3771402127635965e-05, "loss": 1.2673, "step": 14486 }, { "epoch": 0.4, "learning_rate": 1.377058292108441e-05, "loss": 1.3264, "step": 14487 }, { "epoch": 0.4, "learning_rate": 1.3769763685033583e-05, "loss": 1.4448, "step": 14488 }, { "epoch": 0.4, "learning_rate": 1.3768944419489903e-05, "loss": 1.3242, "step": 14489 }, { "epoch": 0.4, "learning_rate": 1.3768125124459768e-05, "loss": 1.3999, "step": 14490 }, { "epoch": 0.4, "learning_rate": 1.37673057999496e-05, "loss": 1.3689, "step": 14491 }, { "epoch": 0.4, "learning_rate": 1.3766486445965797e-05, "loss": 1.689, "step": 14492 }, { "epoch": 0.4, "learning_rate": 1.3765667062514778e-05, "loss": 1.2979, "step": 14493 }, { "epoch": 0.4, "learning_rate": 1.376484764960295e-05, "loss": 1.2844, "step": 14494 }, { "epoch": 0.4, "learning_rate": 1.3764028207236723e-05, "loss": 1.3108, "step": 14495 }, { "epoch": 0.4, "learning_rate": 1.3763208735422513e-05, "loss": 1.4019, "step": 14496 }, { "epoch": 0.4, "learning_rate": 1.3762389234166726e-05, "loss": 1.3518, "step": 14497 }, { "epoch": 0.4, "learning_rate": 1.3761569703475775e-05, "loss": 1.3291, "step": 14498 }, { "epoch": 0.4, "learning_rate": 1.376075014335607e-05, "loss": 1.2644, "step": 14499 }, { "epoch": 0.4, "learning_rate": 1.3759930553814028e-05, "loss": 1.1929, "step": 14500 }, { "epoch": 0.4, "learning_rate": 1.3759110934856053e-05, "loss": 1.3826, "step": 14501 }, { "epoch": 0.4, "learning_rate": 1.3758291286488563e-05, "loss": 1.3945, "step": 14502 }, { "epoch": 0.4, "learning_rate": 1.375747160871797e-05, "loss": 1.407, "step": 14503 }, { "epoch": 0.4, "learning_rate": 1.3756651901550686e-05, "loss": 1.1514, "step": 14504 }, { "epoch": 0.4, "learning_rate": 1.3755832164993121e-05, "loss": 1.1877, "step": 14505 }, { "epoch": 0.4, "learning_rate": 1.3755012399051696e-05, "loss": 1.3152, "step": 14506 }, { "epoch": 0.4, "learning_rate": 1.3754192603732817e-05, "loss": 1.3293, "step": 14507 }, { "epoch": 0.4, "learning_rate": 1.37533727790429e-05, "loss": 1.2268, "step": 14508 }, { "epoch": 0.4, "learning_rate": 1.375255292498836e-05, "loss": 1.3564, "step": 14509 }, { "epoch": 0.4, "learning_rate": 1.3751733041575612e-05, "loss": 1.3669, "step": 14510 }, { "epoch": 0.4, "learning_rate": 1.3750913128811065e-05, "loss": 1.2759, "step": 14511 }, { "epoch": 0.4, "learning_rate": 1.3750093186701144e-05, "loss": 1.3052, "step": 14512 }, { "epoch": 0.4, "learning_rate": 1.374927321525225e-05, "loss": 1.3506, "step": 14513 }, { "epoch": 0.4, "learning_rate": 1.3748453214470811e-05, "loss": 1.1526, "step": 14514 }, { "epoch": 0.4, "learning_rate": 1.3747633184363234e-05, "loss": 1.3335, "step": 14515 }, { "epoch": 0.4, "learning_rate": 1.3746813124935938e-05, "loss": 1.271, "step": 14516 }, { "epoch": 0.4, "learning_rate": 1.3745993036195337e-05, "loss": 1.3589, "step": 14517 }, { "epoch": 0.4, "learning_rate": 1.3745172918147848e-05, "loss": 1.2988, "step": 14518 }, { "epoch": 0.4, "learning_rate": 1.374435277079989e-05, "loss": 1.2336, "step": 14519 }, { "epoch": 0.4, "learning_rate": 1.3743532594157873e-05, "loss": 1.3635, "step": 14520 }, { "epoch": 0.4, "learning_rate": 1.3742712388228218e-05, "loss": 1.2546, "step": 14521 }, { "epoch": 0.4, "learning_rate": 1.3741892153017345e-05, "loss": 1.3308, "step": 14522 }, { "epoch": 0.4, "learning_rate": 1.3741071888531662e-05, "loss": 1.3237, "step": 14523 }, { "epoch": 0.4, "learning_rate": 1.3740251594777593e-05, "loss": 1.3662, "step": 14524 }, { "epoch": 0.4, "learning_rate": 1.3739431271761557e-05, "loss": 1.3127, "step": 14525 }, { "epoch": 0.4, "learning_rate": 1.3738610919489968e-05, "loss": 1.217, "step": 14526 }, { "epoch": 0.4, "learning_rate": 1.3737790537969243e-05, "loss": 1.3103, "step": 14527 }, { "epoch": 0.4, "learning_rate": 1.3736970127205806e-05, "loss": 1.3376, "step": 14528 }, { "epoch": 0.4, "learning_rate": 1.3736149687206068e-05, "loss": 1.4087, "step": 14529 }, { "epoch": 0.4, "learning_rate": 1.3735329217976456e-05, "loss": 1.3728, "step": 14530 }, { "epoch": 0.4, "learning_rate": 1.3734508719523383e-05, "loss": 1.479, "step": 14531 }, { "epoch": 0.4, "learning_rate": 1.373368819185327e-05, "loss": 1.3208, "step": 14532 }, { "epoch": 0.4, "learning_rate": 1.3732867634972533e-05, "loss": 1.3264, "step": 14533 }, { "epoch": 0.4, "learning_rate": 1.37320470488876e-05, "loss": 1.3647, "step": 14534 }, { "epoch": 0.4, "learning_rate": 1.3731226433604883e-05, "loss": 1.4497, "step": 14535 }, { "epoch": 0.4, "learning_rate": 1.3730405789130807e-05, "loss": 1.2803, "step": 14536 }, { "epoch": 0.4, "learning_rate": 1.3729585115471786e-05, "loss": 1.4033, "step": 14537 }, { "epoch": 0.4, "learning_rate": 1.372876441263425e-05, "loss": 1.2988, "step": 14538 }, { "epoch": 0.4, "learning_rate": 1.3727943680624611e-05, "loss": 1.2854, "step": 14539 }, { "epoch": 0.4, "learning_rate": 1.3727122919449293e-05, "loss": 1.3804, "step": 14540 }, { "epoch": 0.4, "learning_rate": 1.3726302129114721e-05, "loss": 1.3113, "step": 14541 }, { "epoch": 0.4, "learning_rate": 1.3725481309627313e-05, "loss": 1.2332, "step": 14542 }, { "epoch": 0.4, "learning_rate": 1.372466046099349e-05, "loss": 1.5259, "step": 14543 }, { "epoch": 0.4, "learning_rate": 1.3723839583219673e-05, "loss": 1.4526, "step": 14544 }, { "epoch": 0.4, "learning_rate": 1.3723018676312293e-05, "loss": 1.3433, "step": 14545 }, { "epoch": 0.4, "learning_rate": 1.3722197740277759e-05, "loss": 1.272, "step": 14546 }, { "epoch": 0.4, "learning_rate": 1.3721376775122503e-05, "loss": 1.1909, "step": 14547 }, { "epoch": 0.4, "learning_rate": 1.3720555780852942e-05, "loss": 1.4121, "step": 14548 }, { "epoch": 0.4, "learning_rate": 1.3719734757475506e-05, "loss": 1.2839, "step": 14549 }, { "epoch": 0.4, "learning_rate": 1.3718913704996612e-05, "loss": 1.2625, "step": 14550 }, { "epoch": 0.4, "learning_rate": 1.3718092623422688e-05, "loss": 1.2957, "step": 14551 }, { "epoch": 0.4, "learning_rate": 1.3717271512760154e-05, "loss": 1.3538, "step": 14552 }, { "epoch": 0.4, "learning_rate": 1.3716450373015436e-05, "loss": 1.4004, "step": 14553 }, { "epoch": 0.4, "learning_rate": 1.3715629204194955e-05, "loss": 1.3452, "step": 14554 }, { "epoch": 0.4, "learning_rate": 1.3714808006305142e-05, "loss": 1.3218, "step": 14555 }, { "epoch": 0.4, "learning_rate": 1.3713986779352416e-05, "loss": 1.3545, "step": 14556 }, { "epoch": 0.4, "learning_rate": 1.3713165523343207e-05, "loss": 1.2449, "step": 14557 }, { "epoch": 0.4, "learning_rate": 1.3712344238283932e-05, "loss": 1.4609, "step": 14558 }, { "epoch": 0.4, "learning_rate": 1.3711522924181026e-05, "loss": 1.3081, "step": 14559 }, { "epoch": 0.4, "learning_rate": 1.3710701581040909e-05, "loss": 1.3037, "step": 14560 }, { "epoch": 0.4, "learning_rate": 1.3709880208870008e-05, "loss": 1.4045, "step": 14561 }, { "epoch": 0.4, "learning_rate": 1.3709058807674747e-05, "loss": 1.4417, "step": 14562 }, { "epoch": 0.4, "learning_rate": 1.3708237377461556e-05, "loss": 1.2175, "step": 14563 }, { "epoch": 0.4, "learning_rate": 1.3707415918236856e-05, "loss": 1.4221, "step": 14564 }, { "epoch": 0.4, "learning_rate": 1.3706594430007081e-05, "loss": 1.3286, "step": 14565 }, { "epoch": 0.4, "learning_rate": 1.3705772912778652e-05, "loss": 1.3181, "step": 14566 }, { "epoch": 0.4, "learning_rate": 1.3704951366558e-05, "loss": 1.3777, "step": 14567 }, { "epoch": 0.4, "learning_rate": 1.3704129791351548e-05, "loss": 1.3767, "step": 14568 }, { "epoch": 0.4, "learning_rate": 1.370330818716573e-05, "loss": 1.2605, "step": 14569 }, { "epoch": 0.4, "learning_rate": 1.3702486554006964e-05, "loss": 1.1929, "step": 14570 }, { "epoch": 0.4, "learning_rate": 1.370166489188169e-05, "loss": 1.3594, "step": 14571 }, { "epoch": 0.4, "learning_rate": 1.3700843200796328e-05, "loss": 1.3208, "step": 14572 }, { "epoch": 0.4, "learning_rate": 1.370002148075731e-05, "loss": 1.2485, "step": 14573 }, { "epoch": 0.4, "learning_rate": 1.3699199731771065e-05, "loss": 1.3284, "step": 14574 }, { "epoch": 0.4, "learning_rate": 1.369837795384402e-05, "loss": 1.2915, "step": 14575 }, { "epoch": 0.4, "learning_rate": 1.3697556146982602e-05, "loss": 1.2976, "step": 14576 }, { "epoch": 0.4, "learning_rate": 1.3696734311193247e-05, "loss": 1.2659, "step": 14577 }, { "epoch": 0.4, "learning_rate": 1.369591244648238e-05, "loss": 1.3206, "step": 14578 }, { "epoch": 0.4, "learning_rate": 1.369509055285643e-05, "loss": 1.4468, "step": 14579 }, { "epoch": 0.4, "learning_rate": 1.3694268630321832e-05, "loss": 1.4556, "step": 14580 }, { "epoch": 0.4, "learning_rate": 1.3693446678885014e-05, "loss": 1.4126, "step": 14581 }, { "epoch": 0.4, "learning_rate": 1.3692624698552404e-05, "loss": 1.2039, "step": 14582 }, { "epoch": 0.4, "learning_rate": 1.3691802689330436e-05, "loss": 1.3311, "step": 14583 }, { "epoch": 0.4, "learning_rate": 1.3690980651225539e-05, "loss": 1.3911, "step": 14584 }, { "epoch": 0.4, "learning_rate": 1.3690158584244141e-05, "loss": 1.0369, "step": 14585 }, { "epoch": 0.4, "learning_rate": 1.3689336488392683e-05, "loss": 1.4224, "step": 14586 }, { "epoch": 0.4, "learning_rate": 1.368851436367759e-05, "loss": 1.3699, "step": 14587 }, { "epoch": 0.4, "learning_rate": 1.3687692210105295e-05, "loss": 1.4106, "step": 14588 }, { "epoch": 0.4, "learning_rate": 1.3686870027682228e-05, "loss": 1.394, "step": 14589 }, { "epoch": 0.4, "learning_rate": 1.3686047816414826e-05, "loss": 1.4297, "step": 14590 }, { "epoch": 0.4, "learning_rate": 1.368522557630952e-05, "loss": 1.2055, "step": 14591 }, { "epoch": 0.4, "learning_rate": 1.3684403307372743e-05, "loss": 1.3223, "step": 14592 }, { "epoch": 0.4, "learning_rate": 1.3683581009610922e-05, "loss": 1.2263, "step": 14593 }, { "epoch": 0.4, "learning_rate": 1.36827586830305e-05, "loss": 1.3025, "step": 14594 }, { "epoch": 0.4, "learning_rate": 1.3681936327637901e-05, "loss": 1.2908, "step": 14595 }, { "epoch": 0.4, "learning_rate": 1.3681113943439568e-05, "loss": 1.3638, "step": 14596 }, { "epoch": 0.4, "learning_rate": 1.3680291530441929e-05, "loss": 1.3311, "step": 14597 }, { "epoch": 0.4, "learning_rate": 1.367946908865142e-05, "loss": 1.2783, "step": 14598 }, { "epoch": 0.4, "learning_rate": 1.3678646618074474e-05, "loss": 1.3628, "step": 14599 }, { "epoch": 0.4, "learning_rate": 1.3677824118717526e-05, "loss": 1.2253, "step": 14600 }, { "epoch": 0.4, "learning_rate": 1.3677001590587011e-05, "loss": 1.249, "step": 14601 }, { "epoch": 0.4, "learning_rate": 1.3676179033689367e-05, "loss": 1.2339, "step": 14602 }, { "epoch": 0.4, "learning_rate": 1.3675356448031028e-05, "loss": 1.3259, "step": 14603 }, { "epoch": 0.4, "learning_rate": 1.3674533833618427e-05, "loss": 1.2549, "step": 14604 }, { "epoch": 0.4, "learning_rate": 1.3673711190457999e-05, "loss": 1.3394, "step": 14605 }, { "epoch": 0.4, "learning_rate": 1.3672888518556184e-05, "loss": 1.342, "step": 14606 }, { "epoch": 0.4, "learning_rate": 1.3672065817919417e-05, "loss": 1.2188, "step": 14607 }, { "epoch": 0.4, "learning_rate": 1.3671243088554133e-05, "loss": 1.2039, "step": 14608 }, { "epoch": 0.4, "learning_rate": 1.3670420330466769e-05, "loss": 1.3098, "step": 14609 }, { "epoch": 0.4, "learning_rate": 1.3669597543663764e-05, "loss": 1.3894, "step": 14610 }, { "epoch": 0.4, "learning_rate": 1.3668774728151552e-05, "loss": 1.3428, "step": 14611 }, { "epoch": 0.4, "learning_rate": 1.3667951883936571e-05, "loss": 1.3704, "step": 14612 }, { "epoch": 0.4, "learning_rate": 1.3667129011025261e-05, "loss": 1.386, "step": 14613 }, { "epoch": 0.4, "learning_rate": 1.366630610942406e-05, "loss": 1.3831, "step": 14614 }, { "epoch": 0.4, "learning_rate": 1.3665483179139398e-05, "loss": 1.3093, "step": 14615 }, { "epoch": 0.4, "learning_rate": 1.3664660220177723e-05, "loss": 1.3921, "step": 14616 }, { "epoch": 0.4, "learning_rate": 1.3663837232545468e-05, "loss": 1.2263, "step": 14617 }, { "epoch": 0.4, "learning_rate": 1.3663014216249074e-05, "loss": 1.2869, "step": 14618 }, { "epoch": 0.4, "learning_rate": 1.3662191171294978e-05, "loss": 1.2961, "step": 14619 }, { "epoch": 0.4, "learning_rate": 1.3661368097689625e-05, "loss": 1.3347, "step": 14620 }, { "epoch": 0.4, "learning_rate": 1.3660544995439446e-05, "loss": 1.1982, "step": 14621 }, { "epoch": 0.4, "learning_rate": 1.3659721864550886e-05, "loss": 1.3472, "step": 14622 }, { "epoch": 0.4, "learning_rate": 1.3658898705030381e-05, "loss": 1.3591, "step": 14623 }, { "epoch": 0.4, "learning_rate": 1.3658075516884376e-05, "loss": 1.3533, "step": 14624 }, { "epoch": 0.4, "learning_rate": 1.3657252300119304e-05, "loss": 1.396, "step": 14625 }, { "epoch": 0.4, "learning_rate": 1.3656429054741613e-05, "loss": 1.2024, "step": 14626 }, { "epoch": 0.4, "learning_rate": 1.3655605780757739e-05, "loss": 1.2117, "step": 14627 }, { "epoch": 0.4, "learning_rate": 1.3654782478174127e-05, "loss": 1.2073, "step": 14628 }, { "epoch": 0.4, "learning_rate": 1.3653959146997213e-05, "loss": 1.439, "step": 14629 }, { "epoch": 0.4, "learning_rate": 1.3653135787233443e-05, "loss": 1.48, "step": 14630 }, { "epoch": 0.4, "learning_rate": 1.3652312398889254e-05, "loss": 1.2988, "step": 14631 }, { "epoch": 0.4, "learning_rate": 1.3651488981971088e-05, "loss": 1.2964, "step": 14632 }, { "epoch": 0.4, "learning_rate": 1.3650665536485392e-05, "loss": 1.2576, "step": 14633 }, { "epoch": 0.4, "learning_rate": 1.3649842062438608e-05, "loss": 1.4399, "step": 14634 }, { "epoch": 0.4, "learning_rate": 1.3649018559837172e-05, "loss": 1.2554, "step": 14635 }, { "epoch": 0.4, "learning_rate": 1.3648195028687534e-05, "loss": 1.2471, "step": 14636 }, { "epoch": 0.4, "learning_rate": 1.364737146899613e-05, "loss": 1.3518, "step": 14637 }, { "epoch": 0.4, "learning_rate": 1.364654788076941e-05, "loss": 1.2554, "step": 14638 }, { "epoch": 0.4, "learning_rate": 1.3645724264013813e-05, "loss": 1.303, "step": 14639 }, { "epoch": 0.4, "learning_rate": 1.3644900618735783e-05, "loss": 1.3652, "step": 14640 }, { "epoch": 0.4, "learning_rate": 1.3644076944941767e-05, "loss": 1.2759, "step": 14641 }, { "epoch": 0.4, "learning_rate": 1.3643253242638204e-05, "loss": 1.2144, "step": 14642 }, { "epoch": 0.4, "learning_rate": 1.3642429511831542e-05, "loss": 1.3752, "step": 14643 }, { "epoch": 0.4, "learning_rate": 1.3641605752528225e-05, "loss": 1.2449, "step": 14644 }, { "epoch": 0.4, "learning_rate": 1.3640781964734694e-05, "loss": 1.303, "step": 14645 }, { "epoch": 0.4, "learning_rate": 1.36399581484574e-05, "loss": 1.2556, "step": 14646 }, { "epoch": 0.4, "learning_rate": 1.3639134303702783e-05, "loss": 1.2878, "step": 14647 }, { "epoch": 0.4, "learning_rate": 1.3638310430477289e-05, "loss": 1.2341, "step": 14648 }, { "epoch": 0.4, "learning_rate": 1.363748652878737e-05, "loss": 1.4119, "step": 14649 }, { "epoch": 0.4, "learning_rate": 1.3636662598639464e-05, "loss": 1.2246, "step": 14650 }, { "epoch": 0.4, "learning_rate": 1.363583864004002e-05, "loss": 1.7329, "step": 14651 }, { "epoch": 0.4, "learning_rate": 1.3635014652995482e-05, "loss": 1.2144, "step": 14652 }, { "epoch": 0.4, "learning_rate": 1.36341906375123e-05, "loss": 1.5122, "step": 14653 }, { "epoch": 0.4, "learning_rate": 1.3633366593596921e-05, "loss": 1.3445, "step": 14654 }, { "epoch": 0.4, "learning_rate": 1.3632542521255792e-05, "loss": 1.5605, "step": 14655 }, { "epoch": 0.4, "learning_rate": 1.3631718420495354e-05, "loss": 1.3577, "step": 14656 }, { "epoch": 0.4, "learning_rate": 1.3630894291322063e-05, "loss": 1.2378, "step": 14657 }, { "epoch": 0.4, "learning_rate": 1.3630070133742358e-05, "loss": 1.3428, "step": 14658 }, { "epoch": 0.4, "learning_rate": 1.3629245947762695e-05, "loss": 1.3157, "step": 14659 }, { "epoch": 0.4, "learning_rate": 1.3628421733389516e-05, "loss": 1.3562, "step": 14660 }, { "epoch": 0.4, "learning_rate": 1.3627597490629274e-05, "loss": 1.4038, "step": 14661 }, { "epoch": 0.4, "learning_rate": 1.3626773219488411e-05, "loss": 1.3315, "step": 14662 }, { "epoch": 0.4, "learning_rate": 1.3625948919973383e-05, "loss": 1.4722, "step": 14663 }, { "epoch": 0.4, "learning_rate": 1.3625124592090633e-05, "loss": 1.272, "step": 14664 }, { "epoch": 0.4, "learning_rate": 1.3624300235846616e-05, "loss": 1.2605, "step": 14665 }, { "epoch": 0.4, "learning_rate": 1.3623475851247776e-05, "loss": 1.3896, "step": 14666 }, { "epoch": 0.4, "learning_rate": 1.3622651438300567e-05, "loss": 1.2803, "step": 14667 }, { "epoch": 0.4, "learning_rate": 1.3621826997011433e-05, "loss": 1.3242, "step": 14668 }, { "epoch": 0.4, "learning_rate": 1.3621002527386832e-05, "loss": 1.2456, "step": 14669 }, { "epoch": 0.4, "learning_rate": 1.3620178029433206e-05, "loss": 1.3472, "step": 14670 }, { "epoch": 0.4, "learning_rate": 1.3619353503157014e-05, "loss": 1.1201, "step": 14671 }, { "epoch": 0.4, "learning_rate": 1.3618528948564698e-05, "loss": 1.2424, "step": 14672 }, { "epoch": 0.4, "learning_rate": 1.3617704365662717e-05, "loss": 1.2915, "step": 14673 }, { "epoch": 0.4, "learning_rate": 1.3616879754457516e-05, "loss": 1.3184, "step": 14674 }, { "epoch": 0.4, "learning_rate": 1.361605511495555e-05, "loss": 1.2661, "step": 14675 }, { "epoch": 0.4, "learning_rate": 1.3615230447163264e-05, "loss": 1.1843, "step": 14676 }, { "epoch": 0.4, "learning_rate": 1.3614405751087118e-05, "loss": 1.2581, "step": 14677 }, { "epoch": 0.4, "learning_rate": 1.3613581026733562e-05, "loss": 1.2222, "step": 14678 }, { "epoch": 0.4, "learning_rate": 1.3612756274109046e-05, "loss": 1.3162, "step": 14679 }, { "epoch": 0.4, "learning_rate": 1.3611931493220025e-05, "loss": 1.3113, "step": 14680 }, { "epoch": 0.4, "learning_rate": 1.361110668407295e-05, "loss": 1.3455, "step": 14681 }, { "epoch": 0.4, "learning_rate": 1.3610281846674273e-05, "loss": 1.332, "step": 14682 }, { "epoch": 0.4, "learning_rate": 1.3609456981030451e-05, "loss": 1.3599, "step": 14683 }, { "epoch": 0.4, "learning_rate": 1.3608632087147933e-05, "loss": 1.4431, "step": 14684 }, { "epoch": 0.4, "learning_rate": 1.3607807165033178e-05, "loss": 1.3684, "step": 14685 }, { "epoch": 0.4, "learning_rate": 1.3606982214692633e-05, "loss": 1.4365, "step": 14686 }, { "epoch": 0.4, "learning_rate": 1.3606157236132756e-05, "loss": 1.3691, "step": 14687 }, { "epoch": 0.4, "learning_rate": 1.3605332229359997e-05, "loss": 1.3125, "step": 14688 }, { "epoch": 0.4, "learning_rate": 1.360450719438082e-05, "loss": 1.377, "step": 14689 }, { "epoch": 0.4, "learning_rate": 1.360368213120167e-05, "loss": 1.3013, "step": 14690 }, { "epoch": 0.4, "learning_rate": 1.3602857039829008e-05, "loss": 1.2714, "step": 14691 }, { "epoch": 0.4, "learning_rate": 1.3602031920269284e-05, "loss": 1.3311, "step": 14692 }, { "epoch": 0.4, "learning_rate": 1.3601206772528958e-05, "loss": 1.3779, "step": 14693 }, { "epoch": 0.4, "learning_rate": 1.3600381596614483e-05, "loss": 1.3574, "step": 14694 }, { "epoch": 0.4, "learning_rate": 1.3599556392532314e-05, "loss": 1.2905, "step": 14695 }, { "epoch": 0.4, "learning_rate": 1.3598731160288909e-05, "loss": 1.3962, "step": 14696 }, { "epoch": 0.4, "learning_rate": 1.3597905899890725e-05, "loss": 1.3491, "step": 14697 }, { "epoch": 0.4, "learning_rate": 1.3597080611344216e-05, "loss": 1.3809, "step": 14698 }, { "epoch": 0.4, "learning_rate": 1.359625529465584e-05, "loss": 1.4436, "step": 14699 }, { "epoch": 0.4, "learning_rate": 1.3595429949832055e-05, "loss": 1.3899, "step": 14700 }, { "epoch": 0.4, "learning_rate": 1.3594604576879315e-05, "loss": 1.3496, "step": 14701 }, { "epoch": 0.4, "learning_rate": 1.359377917580408e-05, "loss": 1.209, "step": 14702 }, { "epoch": 0.4, "learning_rate": 1.3592953746612807e-05, "loss": 1.2959, "step": 14703 }, { "epoch": 0.4, "learning_rate": 1.3592128289311952e-05, "loss": 1.3489, "step": 14704 }, { "epoch": 0.4, "learning_rate": 1.3591302803907976e-05, "loss": 1.3516, "step": 14705 }, { "epoch": 0.4, "learning_rate": 1.3590477290407335e-05, "loss": 1.3232, "step": 14706 }, { "epoch": 0.4, "learning_rate": 1.3589651748816488e-05, "loss": 1.2627, "step": 14707 }, { "epoch": 0.4, "learning_rate": 1.3588826179141894e-05, "loss": 1.2559, "step": 14708 }, { "epoch": 0.4, "learning_rate": 1.358800058139001e-05, "loss": 1.3567, "step": 14709 }, { "epoch": 0.4, "learning_rate": 1.3587174955567295e-05, "loss": 1.1702, "step": 14710 }, { "epoch": 0.4, "learning_rate": 1.3586349301680213e-05, "loss": 1.2979, "step": 14711 }, { "epoch": 0.4, "learning_rate": 1.3585523619735222e-05, "loss": 1.3477, "step": 14712 }, { "epoch": 0.4, "learning_rate": 1.3584697909738775e-05, "loss": 1.1155, "step": 14713 }, { "epoch": 0.4, "learning_rate": 1.3583872171697343e-05, "loss": 1.3469, "step": 14714 }, { "epoch": 0.4, "learning_rate": 1.3583046405617378e-05, "loss": 1.4758, "step": 14715 }, { "epoch": 0.4, "learning_rate": 1.3582220611505343e-05, "loss": 1.752, "step": 14716 }, { "epoch": 0.4, "learning_rate": 1.3581394789367697e-05, "loss": 1.2754, "step": 14717 }, { "epoch": 0.4, "learning_rate": 1.3580568939210905e-05, "loss": 1.3643, "step": 14718 }, { "epoch": 0.4, "learning_rate": 1.3579743061041422e-05, "loss": 1.2739, "step": 14719 }, { "epoch": 0.4, "learning_rate": 1.3578917154865717e-05, "loss": 1.2295, "step": 14720 }, { "epoch": 0.4, "learning_rate": 1.3578091220690243e-05, "loss": 1.301, "step": 14721 }, { "epoch": 0.4, "learning_rate": 1.3577265258521468e-05, "loss": 1.6306, "step": 14722 }, { "epoch": 0.4, "learning_rate": 1.3576439268365848e-05, "loss": 1.3315, "step": 14723 }, { "epoch": 0.4, "learning_rate": 1.3575613250229855e-05, "loss": 1.3772, "step": 14724 }, { "epoch": 0.4, "learning_rate": 1.357478720411994e-05, "loss": 1.2148, "step": 14725 }, { "epoch": 0.4, "learning_rate": 1.3573961130042572e-05, "loss": 1.6958, "step": 14726 }, { "epoch": 0.4, "learning_rate": 1.3573135028004213e-05, "loss": 1.2319, "step": 14727 }, { "epoch": 0.4, "learning_rate": 1.3572308898011328e-05, "loss": 1.2144, "step": 14728 }, { "epoch": 0.4, "learning_rate": 1.3571482740070377e-05, "loss": 1.3284, "step": 14729 }, { "epoch": 0.4, "learning_rate": 1.3570656554187825e-05, "loss": 1.366, "step": 14730 }, { "epoch": 0.4, "learning_rate": 1.3569830340370134e-05, "loss": 1.1968, "step": 14731 }, { "epoch": 0.4, "learning_rate": 1.356900409862377e-05, "loss": 1.2051, "step": 14732 }, { "epoch": 0.4, "learning_rate": 1.3568177828955193e-05, "loss": 1.3999, "step": 14733 }, { "epoch": 0.4, "learning_rate": 1.3567351531370875e-05, "loss": 1.251, "step": 14734 }, { "epoch": 0.4, "learning_rate": 1.3566525205877275e-05, "loss": 1.4182, "step": 14735 }, { "epoch": 0.4, "learning_rate": 1.3565698852480857e-05, "loss": 1.2498, "step": 14736 }, { "epoch": 0.4, "learning_rate": 1.3564872471188089e-05, "loss": 1.3074, "step": 14737 }, { "epoch": 0.4, "learning_rate": 1.3564046062005436e-05, "loss": 1.3271, "step": 14738 }, { "epoch": 0.4, "learning_rate": 1.3563219624939361e-05, "loss": 1.2664, "step": 14739 }, { "epoch": 0.4, "learning_rate": 1.3562393159996333e-05, "loss": 1.3232, "step": 14740 }, { "epoch": 0.4, "learning_rate": 1.3561566667182812e-05, "loss": 1.1851, "step": 14741 }, { "epoch": 0.4, "learning_rate": 1.3560740146505271e-05, "loss": 1.3049, "step": 14742 }, { "epoch": 0.4, "learning_rate": 1.3559913597970176e-05, "loss": 1.2588, "step": 14743 }, { "epoch": 0.4, "learning_rate": 1.3559087021583985e-05, "loss": 1.252, "step": 14744 }, { "epoch": 0.4, "learning_rate": 1.3558260417353178e-05, "loss": 1.4375, "step": 14745 }, { "epoch": 0.4, "learning_rate": 1.3557433785284208e-05, "loss": 1.4243, "step": 14746 }, { "epoch": 0.4, "learning_rate": 1.3556607125383554e-05, "loss": 1.3728, "step": 14747 }, { "epoch": 0.4, "learning_rate": 1.3555780437657675e-05, "loss": 1.2112, "step": 14748 }, { "epoch": 0.4, "learning_rate": 1.3554953722113043e-05, "loss": 1.1865, "step": 14749 }, { "epoch": 0.4, "learning_rate": 1.3554126978756124e-05, "loss": 1.2292, "step": 14750 }, { "epoch": 0.4, "learning_rate": 1.3553300207593387e-05, "loss": 1.1636, "step": 14751 }, { "epoch": 0.4, "learning_rate": 1.3552473408631302e-05, "loss": 1.3342, "step": 14752 }, { "epoch": 0.4, "learning_rate": 1.3551646581876332e-05, "loss": 1.3052, "step": 14753 }, { "epoch": 0.4, "learning_rate": 1.3550819727334953e-05, "loss": 1.4326, "step": 14754 }, { "epoch": 0.4, "learning_rate": 1.3549992845013628e-05, "loss": 1.2441, "step": 14755 }, { "epoch": 0.4, "learning_rate": 1.354916593491883e-05, "loss": 1.25, "step": 14756 }, { "epoch": 0.4, "learning_rate": 1.3548338997057025e-05, "loss": 1.4814, "step": 14757 }, { "epoch": 0.4, "learning_rate": 1.3547512031434683e-05, "loss": 1.3059, "step": 14758 }, { "epoch": 0.4, "learning_rate": 1.3546685038058279e-05, "loss": 1.2124, "step": 14759 }, { "epoch": 0.4, "learning_rate": 1.3545858016934274e-05, "loss": 1.2295, "step": 14760 }, { "epoch": 0.4, "learning_rate": 1.3545030968069148e-05, "loss": 1.4509, "step": 14761 }, { "epoch": 0.4, "learning_rate": 1.3544203891469366e-05, "loss": 1.1882, "step": 14762 }, { "epoch": 0.4, "learning_rate": 1.3543376787141398e-05, "loss": 1.1584, "step": 14763 }, { "epoch": 0.4, "learning_rate": 1.3542549655091714e-05, "loss": 1.2993, "step": 14764 }, { "epoch": 0.4, "learning_rate": 1.3541722495326792e-05, "loss": 1.3853, "step": 14765 }, { "epoch": 0.4, "learning_rate": 1.3540895307853095e-05, "loss": 1.4272, "step": 14766 }, { "epoch": 0.4, "learning_rate": 1.35400680926771e-05, "loss": 1.2549, "step": 14767 }, { "epoch": 0.4, "learning_rate": 1.3539240849805278e-05, "loss": 1.3188, "step": 14768 }, { "epoch": 0.4, "learning_rate": 1.3538413579244099e-05, "loss": 1.2061, "step": 14769 }, { "epoch": 0.4, "learning_rate": 1.3537586281000032e-05, "loss": 1.3181, "step": 14770 }, { "epoch": 0.4, "learning_rate": 1.353675895507956e-05, "loss": 1.3345, "step": 14771 }, { "epoch": 0.4, "learning_rate": 1.3535931601489141e-05, "loss": 1.3464, "step": 14772 }, { "epoch": 0.4, "learning_rate": 1.3535104220235262e-05, "loss": 1.4619, "step": 14773 }, { "epoch": 0.4, "learning_rate": 1.3534276811324387e-05, "loss": 1.3896, "step": 14774 }, { "epoch": 0.4, "learning_rate": 1.3533449374762994e-05, "loss": 1.3801, "step": 14775 }, { "epoch": 0.4, "learning_rate": 1.3532621910557556e-05, "loss": 1.4224, "step": 14776 }, { "epoch": 0.4, "learning_rate": 1.3531794418714544e-05, "loss": 1.27, "step": 14777 }, { "epoch": 0.4, "learning_rate": 1.3530966899240431e-05, "loss": 1.2566, "step": 14778 }, { "epoch": 0.4, "learning_rate": 1.3530139352141696e-05, "loss": 1.3936, "step": 14779 }, { "epoch": 0.4, "learning_rate": 1.3529311777424809e-05, "loss": 1.4243, "step": 14780 }, { "epoch": 0.4, "learning_rate": 1.3528484175096248e-05, "loss": 1.2141, "step": 14781 }, { "epoch": 0.4, "learning_rate": 1.3527656545162484e-05, "loss": 1.8169, "step": 14782 }, { "epoch": 0.4, "learning_rate": 1.3526828887629997e-05, "loss": 1.4131, "step": 14783 }, { "epoch": 0.4, "learning_rate": 1.3526001202505257e-05, "loss": 1.1917, "step": 14784 }, { "epoch": 0.4, "learning_rate": 1.3525173489794743e-05, "loss": 1.2681, "step": 14785 }, { "epoch": 0.4, "learning_rate": 1.3524345749504928e-05, "loss": 1.0999, "step": 14786 }, { "epoch": 0.4, "learning_rate": 1.3523517981642287e-05, "loss": 1.3987, "step": 14787 }, { "epoch": 0.4, "learning_rate": 1.3522690186213301e-05, "loss": 1.2488, "step": 14788 }, { "epoch": 0.4, "learning_rate": 1.3521862363224443e-05, "loss": 1.1917, "step": 14789 }, { "epoch": 0.4, "learning_rate": 1.352103451268219e-05, "loss": 1.2524, "step": 14790 }, { "epoch": 0.4, "learning_rate": 1.3520206634593018e-05, "loss": 1.7393, "step": 14791 }, { "epoch": 0.4, "learning_rate": 1.3519378728963406e-05, "loss": 1.3879, "step": 14792 }, { "epoch": 0.4, "learning_rate": 1.351855079579983e-05, "loss": 1.3218, "step": 14793 }, { "epoch": 0.4, "learning_rate": 1.3517722835108764e-05, "loss": 1.2837, "step": 14794 }, { "epoch": 0.4, "learning_rate": 1.3516894846896693e-05, "loss": 1.2527, "step": 14795 }, { "epoch": 0.4, "learning_rate": 1.3516066831170086e-05, "loss": 1.4897, "step": 14796 }, { "epoch": 0.4, "learning_rate": 1.351523878793543e-05, "loss": 1.3474, "step": 14797 }, { "epoch": 0.4, "learning_rate": 1.3514410717199196e-05, "loss": 1.2212, "step": 14798 }, { "epoch": 0.4, "learning_rate": 1.3513582618967867e-05, "loss": 1.355, "step": 14799 }, { "epoch": 0.4, "learning_rate": 1.3512754493247917e-05, "loss": 1.3835, "step": 14800 }, { "epoch": 0.4, "learning_rate": 1.3511926340045828e-05, "loss": 1.3254, "step": 14801 }, { "epoch": 0.4, "learning_rate": 1.3511098159368081e-05, "loss": 1.5264, "step": 14802 }, { "epoch": 0.4, "learning_rate": 1.3510269951221151e-05, "loss": 1.3513, "step": 14803 }, { "epoch": 0.4, "learning_rate": 1.3509441715611522e-05, "loss": 1.3652, "step": 14804 }, { "epoch": 0.4, "learning_rate": 1.3508613452545669e-05, "loss": 1.5332, "step": 14805 }, { "epoch": 0.4, "learning_rate": 1.3507785162030076e-05, "loss": 1.2458, "step": 14806 }, { "epoch": 0.4, "learning_rate": 1.3506956844071218e-05, "loss": 1.2395, "step": 14807 }, { "epoch": 0.4, "learning_rate": 1.3506128498675583e-05, "loss": 1.417, "step": 14808 }, { "epoch": 0.4, "learning_rate": 1.3505300125849642e-05, "loss": 1.3022, "step": 14809 }, { "epoch": 0.4, "learning_rate": 1.3504471725599888e-05, "loss": 1.1807, "step": 14810 }, { "epoch": 0.4, "learning_rate": 1.3503643297932789e-05, "loss": 1.3306, "step": 14811 }, { "epoch": 0.4, "learning_rate": 1.3502814842854837e-05, "loss": 1.2292, "step": 14812 }, { "epoch": 0.4, "learning_rate": 1.3501986360372507e-05, "loss": 1.3931, "step": 14813 }, { "epoch": 0.4, "learning_rate": 1.3501157850492283e-05, "loss": 1.4319, "step": 14814 }, { "epoch": 0.4, "learning_rate": 1.3500329313220645e-05, "loss": 1.3391, "step": 14815 }, { "epoch": 0.4, "learning_rate": 1.3499500748564078e-05, "loss": 1.4521, "step": 14816 }, { "epoch": 0.4, "learning_rate": 1.349867215652906e-05, "loss": 1.3472, "step": 14817 }, { "epoch": 0.4, "learning_rate": 1.3497843537122077e-05, "loss": 1.3398, "step": 14818 }, { "epoch": 0.4, "learning_rate": 1.349701489034961e-05, "loss": 1.7817, "step": 14819 }, { "epoch": 0.4, "learning_rate": 1.3496186216218148e-05, "loss": 1.2539, "step": 14820 }, { "epoch": 0.4, "learning_rate": 1.3495357514734164e-05, "loss": 1.079, "step": 14821 }, { "epoch": 0.4, "learning_rate": 1.349452878590415e-05, "loss": 1.3198, "step": 14822 }, { "epoch": 0.4, "learning_rate": 1.3493700029734584e-05, "loss": 1.2908, "step": 14823 }, { "epoch": 0.4, "learning_rate": 1.3492871246231954e-05, "loss": 1.3469, "step": 14824 }, { "epoch": 0.4, "learning_rate": 1.3492042435402737e-05, "loss": 1.3528, "step": 14825 }, { "epoch": 0.4, "learning_rate": 1.3491213597253427e-05, "loss": 1.491, "step": 14826 }, { "epoch": 0.4, "learning_rate": 1.34903847317905e-05, "loss": 1.3157, "step": 14827 }, { "epoch": 0.4, "learning_rate": 1.3489555839020447e-05, "loss": 1.2881, "step": 14828 }, { "epoch": 0.4, "learning_rate": 1.3488726918949749e-05, "loss": 1.177, "step": 14829 }, { "epoch": 0.4, "learning_rate": 1.3487897971584892e-05, "loss": 1.3396, "step": 14830 }, { "epoch": 0.41, "learning_rate": 1.348706899693236e-05, "loss": 1.3938, "step": 14831 }, { "epoch": 0.41, "learning_rate": 1.3486239994998642e-05, "loss": 1.4136, "step": 14832 }, { "epoch": 0.41, "learning_rate": 1.3485410965790223e-05, "loss": 1.3125, "step": 14833 }, { "epoch": 0.41, "learning_rate": 1.3484581909313583e-05, "loss": 1.4224, "step": 14834 }, { "epoch": 0.41, "learning_rate": 1.3483752825575214e-05, "loss": 1.3464, "step": 14835 }, { "epoch": 0.41, "learning_rate": 1.3482923714581601e-05, "loss": 1.3691, "step": 14836 }, { "epoch": 0.41, "learning_rate": 1.3482094576339233e-05, "loss": 1.4146, "step": 14837 }, { "epoch": 0.41, "learning_rate": 1.3481265410854593e-05, "loss": 1.2524, "step": 14838 }, { "epoch": 0.41, "learning_rate": 1.348043621813417e-05, "loss": 1.2898, "step": 14839 }, { "epoch": 0.41, "learning_rate": 1.347960699818445e-05, "loss": 1.3867, "step": 14840 }, { "epoch": 0.41, "learning_rate": 1.3478777751011923e-05, "loss": 1.2949, "step": 14841 }, { "epoch": 0.41, "learning_rate": 1.3477948476623073e-05, "loss": 1.2788, "step": 14842 }, { "epoch": 0.41, "learning_rate": 1.3477119175024389e-05, "loss": 1.2808, "step": 14843 }, { "epoch": 0.41, "learning_rate": 1.3476289846222362e-05, "loss": 1.3701, "step": 14844 }, { "epoch": 0.41, "learning_rate": 1.3475460490223473e-05, "loss": 1.5056, "step": 14845 }, { "epoch": 0.41, "learning_rate": 1.347463110703422e-05, "loss": 1.3245, "step": 14846 }, { "epoch": 0.41, "learning_rate": 1.3473801696661086e-05, "loss": 1.354, "step": 14847 }, { "epoch": 0.41, "learning_rate": 1.3472972259110561e-05, "loss": 1.3145, "step": 14848 }, { "epoch": 0.41, "learning_rate": 1.3472142794389134e-05, "loss": 1.3569, "step": 14849 }, { "epoch": 0.41, "learning_rate": 1.3471313302503292e-05, "loss": 1.3359, "step": 14850 }, { "epoch": 0.41, "learning_rate": 1.347048378345953e-05, "loss": 1.4248, "step": 14851 }, { "epoch": 0.41, "learning_rate": 1.3469654237264333e-05, "loss": 1.2441, "step": 14852 }, { "epoch": 0.41, "learning_rate": 1.3468824663924197e-05, "loss": 1.3518, "step": 14853 }, { "epoch": 0.41, "learning_rate": 1.3467995063445602e-05, "loss": 1.2839, "step": 14854 }, { "epoch": 0.41, "learning_rate": 1.346716543583505e-05, "loss": 1.3135, "step": 14855 }, { "epoch": 0.41, "learning_rate": 1.3466335781099023e-05, "loss": 1.2905, "step": 14856 }, { "epoch": 0.41, "learning_rate": 1.3465506099244014e-05, "loss": 1.2705, "step": 14857 }, { "epoch": 0.41, "learning_rate": 1.3464676390276517e-05, "loss": 1.3489, "step": 14858 }, { "epoch": 0.41, "learning_rate": 1.3463846654203021e-05, "loss": 1.4009, "step": 14859 }, { "epoch": 0.41, "learning_rate": 1.3463016891030016e-05, "loss": 1.4512, "step": 14860 }, { "epoch": 0.41, "learning_rate": 1.3462187100763997e-05, "loss": 1.3638, "step": 14861 }, { "epoch": 0.41, "learning_rate": 1.3461357283411451e-05, "loss": 1.4155, "step": 14862 }, { "epoch": 0.41, "learning_rate": 1.3460527438978877e-05, "loss": 1.3394, "step": 14863 }, { "epoch": 0.41, "learning_rate": 1.3459697567472763e-05, "loss": 1.2649, "step": 14864 }, { "epoch": 0.41, "learning_rate": 1.3458867668899598e-05, "loss": 1.228, "step": 14865 }, { "epoch": 0.41, "learning_rate": 1.3458037743265882e-05, "loss": 1.3418, "step": 14866 }, { "epoch": 0.41, "learning_rate": 1.3457207790578106e-05, "loss": 1.2583, "step": 14867 }, { "epoch": 0.41, "learning_rate": 1.345637781084276e-05, "loss": 1.2617, "step": 14868 }, { "epoch": 0.41, "learning_rate": 1.345554780406634e-05, "loss": 1.2332, "step": 14869 }, { "epoch": 0.41, "learning_rate": 1.3454717770255338e-05, "loss": 1.2383, "step": 14870 }, { "epoch": 0.41, "learning_rate": 1.3453887709416251e-05, "loss": 1.2754, "step": 14871 }, { "epoch": 0.41, "learning_rate": 1.345305762155557e-05, "loss": 1.2998, "step": 14872 }, { "epoch": 0.41, "learning_rate": 1.345222750667979e-05, "loss": 1.3315, "step": 14873 }, { "epoch": 0.41, "learning_rate": 1.3451397364795403e-05, "loss": 1.4351, "step": 14874 }, { "epoch": 0.41, "learning_rate": 1.3450567195908908e-05, "loss": 1.3628, "step": 14875 }, { "epoch": 0.41, "learning_rate": 1.3449737000026797e-05, "loss": 1.4114, "step": 14876 }, { "epoch": 0.41, "learning_rate": 1.3448906777155567e-05, "loss": 1.2727, "step": 14877 }, { "epoch": 0.41, "learning_rate": 1.3448076527301712e-05, "loss": 1.6982, "step": 14878 }, { "epoch": 0.41, "learning_rate": 1.3447246250471727e-05, "loss": 1.3254, "step": 14879 }, { "epoch": 0.41, "learning_rate": 1.3446415946672104e-05, "loss": 1.3027, "step": 14880 }, { "epoch": 0.41, "learning_rate": 1.344558561590935e-05, "loss": 1.3594, "step": 14881 }, { "epoch": 0.41, "learning_rate": 1.3444755258189953e-05, "loss": 1.2583, "step": 14882 }, { "epoch": 0.41, "learning_rate": 1.3443924873520409e-05, "loss": 1.356, "step": 14883 }, { "epoch": 0.41, "learning_rate": 1.3443094461907216e-05, "loss": 1.2437, "step": 14884 }, { "epoch": 0.41, "learning_rate": 1.3442264023356874e-05, "loss": 1.3203, "step": 14885 }, { "epoch": 0.41, "learning_rate": 1.3441433557875874e-05, "loss": 1.4441, "step": 14886 }, { "epoch": 0.41, "learning_rate": 1.3440603065470717e-05, "loss": 1.2292, "step": 14887 }, { "epoch": 0.41, "learning_rate": 1.34397725461479e-05, "loss": 1.2451, "step": 14888 }, { "epoch": 0.41, "learning_rate": 1.3438941999913919e-05, "loss": 1.2468, "step": 14889 }, { "epoch": 0.41, "learning_rate": 1.3438111426775273e-05, "loss": 1.3955, "step": 14890 }, { "epoch": 0.41, "learning_rate": 1.3437280826738461e-05, "loss": 1.3857, "step": 14891 }, { "epoch": 0.41, "learning_rate": 1.3436450199809979e-05, "loss": 1.364, "step": 14892 }, { "epoch": 0.41, "learning_rate": 1.343561954599633e-05, "loss": 1.3623, "step": 14893 }, { "epoch": 0.41, "learning_rate": 1.3434788865304005e-05, "loss": 1.1501, "step": 14894 }, { "epoch": 0.41, "learning_rate": 1.3433958157739509e-05, "loss": 1.3789, "step": 14895 }, { "epoch": 0.41, "learning_rate": 1.3433127423309338e-05, "loss": 1.1465, "step": 14896 }, { "epoch": 0.41, "learning_rate": 1.343229666201999e-05, "loss": 1.3464, "step": 14897 }, { "epoch": 0.41, "learning_rate": 1.3431465873877972e-05, "loss": 1.2229, "step": 14898 }, { "epoch": 0.41, "learning_rate": 1.3430635058889776e-05, "loss": 1.1033, "step": 14899 }, { "epoch": 0.41, "learning_rate": 1.3429804217061904e-05, "loss": 1.3499, "step": 14900 }, { "epoch": 0.41, "learning_rate": 1.3428973348400857e-05, "loss": 1.4023, "step": 14901 }, { "epoch": 0.41, "learning_rate": 1.3428142452913136e-05, "loss": 1.2944, "step": 14902 }, { "epoch": 0.41, "learning_rate": 1.3427311530605241e-05, "loss": 1.3315, "step": 14903 }, { "epoch": 0.41, "learning_rate": 1.342648058148367e-05, "loss": 1.2017, "step": 14904 }, { "epoch": 0.41, "learning_rate": 1.342564960555493e-05, "loss": 1.1711, "step": 14905 }, { "epoch": 0.41, "learning_rate": 1.3424818602825513e-05, "loss": 1.2817, "step": 14906 }, { "epoch": 0.41, "learning_rate": 1.3423987573301931e-05, "loss": 1.4702, "step": 14907 }, { "epoch": 0.41, "learning_rate": 1.3423156516990676e-05, "loss": 1.3816, "step": 14908 }, { "epoch": 0.41, "learning_rate": 1.3422325433898259e-05, "loss": 1.3176, "step": 14909 }, { "epoch": 0.41, "learning_rate": 1.342149432403117e-05, "loss": 1.385, "step": 14910 }, { "epoch": 0.41, "learning_rate": 1.3420663187395921e-05, "loss": 1.1978, "step": 14911 }, { "epoch": 0.41, "learning_rate": 1.3419832023999016e-05, "loss": 1.2444, "step": 14912 }, { "epoch": 0.41, "learning_rate": 1.341900083384695e-05, "loss": 1.1821, "step": 14913 }, { "epoch": 0.41, "learning_rate": 1.3418169616946229e-05, "loss": 1.2513, "step": 14914 }, { "epoch": 0.41, "learning_rate": 1.3417338373303354e-05, "loss": 1.2246, "step": 14915 }, { "epoch": 0.41, "learning_rate": 1.3416507102924835e-05, "loss": 1.3828, "step": 14916 }, { "epoch": 0.41, "learning_rate": 1.341567580581717e-05, "loss": 1.272, "step": 14917 }, { "epoch": 0.41, "learning_rate": 1.3414844481986864e-05, "loss": 1.2871, "step": 14918 }, { "epoch": 0.41, "learning_rate": 1.3414013131440417e-05, "loss": 1.2668, "step": 14919 }, { "epoch": 0.41, "learning_rate": 1.3413181754184342e-05, "loss": 1.3867, "step": 14920 }, { "epoch": 0.41, "learning_rate": 1.3412350350225134e-05, "loss": 1.2817, "step": 14921 }, { "epoch": 0.41, "learning_rate": 1.3411518919569303e-05, "loss": 1.3345, "step": 14922 }, { "epoch": 0.41, "learning_rate": 1.3410687462223351e-05, "loss": 1.3987, "step": 14923 }, { "epoch": 0.41, "learning_rate": 1.3409855978193787e-05, "loss": 1.2568, "step": 14924 }, { "epoch": 0.41, "learning_rate": 1.3409024467487108e-05, "loss": 1.3633, "step": 14925 }, { "epoch": 0.41, "learning_rate": 1.3408192930109828e-05, "loss": 1.0532, "step": 14926 }, { "epoch": 0.41, "learning_rate": 1.3407361366068447e-05, "loss": 1.3796, "step": 14927 }, { "epoch": 0.41, "learning_rate": 1.3406529775369476e-05, "loss": 1.1384, "step": 14928 }, { "epoch": 0.41, "learning_rate": 1.3405698158019416e-05, "loss": 1.2244, "step": 14929 }, { "epoch": 0.41, "learning_rate": 1.3404866514024776e-05, "loss": 1.2703, "step": 14930 }, { "epoch": 0.41, "learning_rate": 1.3404034843392061e-05, "loss": 1.6938, "step": 14931 }, { "epoch": 0.41, "learning_rate": 1.3403203146127778e-05, "loss": 1.396, "step": 14932 }, { "epoch": 0.41, "learning_rate": 1.3402371422238436e-05, "loss": 1.5303, "step": 14933 }, { "epoch": 0.41, "learning_rate": 1.3401539671730536e-05, "loss": 1.3108, "step": 14934 }, { "epoch": 0.41, "learning_rate": 1.3400707894610593e-05, "loss": 1.3518, "step": 14935 }, { "epoch": 0.41, "learning_rate": 1.3399876090885108e-05, "loss": 1.2849, "step": 14936 }, { "epoch": 0.41, "learning_rate": 1.3399044260560593e-05, "loss": 1.2947, "step": 14937 }, { "epoch": 0.41, "learning_rate": 1.3398212403643554e-05, "loss": 1.4377, "step": 14938 }, { "epoch": 0.41, "learning_rate": 1.3397380520140497e-05, "loss": 1.4717, "step": 14939 }, { "epoch": 0.41, "learning_rate": 1.3396548610057934e-05, "loss": 1.3271, "step": 14940 }, { "epoch": 0.41, "learning_rate": 1.339571667340237e-05, "loss": 1.406, "step": 14941 }, { "epoch": 0.41, "learning_rate": 1.3394884710180316e-05, "loss": 1.2092, "step": 14942 }, { "epoch": 0.41, "learning_rate": 1.339405272039828e-05, "loss": 1.3538, "step": 14943 }, { "epoch": 0.41, "learning_rate": 1.3393220704062775e-05, "loss": 1.4719, "step": 14944 }, { "epoch": 0.41, "learning_rate": 1.3392388661180303e-05, "loss": 1.3545, "step": 14945 }, { "epoch": 0.41, "learning_rate": 1.339155659175738e-05, "loss": 1.3694, "step": 14946 }, { "epoch": 0.41, "learning_rate": 1.3390724495800511e-05, "loss": 1.302, "step": 14947 }, { "epoch": 0.41, "learning_rate": 1.3389892373316209e-05, "loss": 1.2893, "step": 14948 }, { "epoch": 0.41, "learning_rate": 1.3389060224310983e-05, "loss": 1.1936, "step": 14949 }, { "epoch": 0.41, "learning_rate": 1.3388228048791346e-05, "loss": 1.1946, "step": 14950 }, { "epoch": 0.41, "learning_rate": 1.3387395846763802e-05, "loss": 1.2373, "step": 14951 }, { "epoch": 0.41, "learning_rate": 1.3386563618234868e-05, "loss": 1.3022, "step": 14952 }, { "epoch": 0.41, "learning_rate": 1.338573136321105e-05, "loss": 1.3884, "step": 14953 }, { "epoch": 0.41, "learning_rate": 1.3384899081698866e-05, "loss": 1.3633, "step": 14954 }, { "epoch": 0.41, "learning_rate": 1.338406677370482e-05, "loss": 1.4419, "step": 14955 }, { "epoch": 0.41, "learning_rate": 1.3383234439235429e-05, "loss": 1.3818, "step": 14956 }, { "epoch": 0.41, "learning_rate": 1.3382402078297201e-05, "loss": 1.3896, "step": 14957 }, { "epoch": 0.41, "learning_rate": 1.338156969089665e-05, "loss": 1.2849, "step": 14958 }, { "epoch": 0.41, "learning_rate": 1.3380737277040288e-05, "loss": 1.2749, "step": 14959 }, { "epoch": 0.41, "learning_rate": 1.3379904836734627e-05, "loss": 1.4114, "step": 14960 }, { "epoch": 0.41, "learning_rate": 1.337907236998618e-05, "loss": 1.3008, "step": 14961 }, { "epoch": 0.41, "learning_rate": 1.337823987680146e-05, "loss": 1.3608, "step": 14962 }, { "epoch": 0.41, "learning_rate": 1.3377407357186983e-05, "loss": 1.2913, "step": 14963 }, { "epoch": 0.41, "learning_rate": 1.3376574811149254e-05, "loss": 1.3538, "step": 14964 }, { "epoch": 0.41, "learning_rate": 1.3375742238694796e-05, "loss": 1.2288, "step": 14965 }, { "epoch": 0.41, "learning_rate": 1.3374909639830112e-05, "loss": 1.4631, "step": 14966 }, { "epoch": 0.41, "learning_rate": 1.3374077014561726e-05, "loss": 1.3508, "step": 14967 }, { "epoch": 0.41, "learning_rate": 1.3373244362896148e-05, "loss": 1.3083, "step": 14968 }, { "epoch": 0.41, "learning_rate": 1.3372411684839893e-05, "loss": 1.417, "step": 14969 }, { "epoch": 0.41, "learning_rate": 1.3371578980399473e-05, "loss": 1.1733, "step": 14970 }, { "epoch": 0.41, "learning_rate": 1.3370746249581405e-05, "loss": 1.4846, "step": 14971 }, { "epoch": 0.41, "learning_rate": 1.3369913492392203e-05, "loss": 1.4094, "step": 14972 }, { "epoch": 0.41, "learning_rate": 1.3369080708838383e-05, "loss": 1.3176, "step": 14973 }, { "epoch": 0.41, "learning_rate": 1.3368247898926457e-05, "loss": 1.3889, "step": 14974 }, { "epoch": 0.41, "learning_rate": 1.3367415062662948e-05, "loss": 1.3022, "step": 14975 }, { "epoch": 0.41, "learning_rate": 1.3366582200054363e-05, "loss": 1.2578, "step": 14976 }, { "epoch": 0.41, "learning_rate": 1.3365749311107226e-05, "loss": 1.3694, "step": 14977 }, { "epoch": 0.41, "learning_rate": 1.3364916395828048e-05, "loss": 1.3201, "step": 14978 }, { "epoch": 0.41, "learning_rate": 1.3364083454223344e-05, "loss": 1.4009, "step": 14979 }, { "epoch": 0.41, "learning_rate": 1.3363250486299634e-05, "loss": 1.4375, "step": 14980 }, { "epoch": 0.41, "learning_rate": 1.3362417492063436e-05, "loss": 1.3511, "step": 14981 }, { "epoch": 0.41, "learning_rate": 1.336158447152126e-05, "loss": 1.252, "step": 14982 }, { "epoch": 0.41, "learning_rate": 1.3360751424679631e-05, "loss": 1.2542, "step": 14983 }, { "epoch": 0.41, "learning_rate": 1.3359918351545065e-05, "loss": 1.3835, "step": 14984 }, { "epoch": 0.41, "learning_rate": 1.3359085252124076e-05, "loss": 1.344, "step": 14985 }, { "epoch": 0.41, "learning_rate": 1.3358252126423182e-05, "loss": 1.2639, "step": 14986 }, { "epoch": 0.41, "learning_rate": 1.3357418974448904e-05, "loss": 1.1995, "step": 14987 }, { "epoch": 0.41, "learning_rate": 1.3356585796207758e-05, "loss": 1.1663, "step": 14988 }, { "epoch": 0.41, "learning_rate": 1.3355752591706262e-05, "loss": 1.2568, "step": 14989 }, { "epoch": 0.41, "learning_rate": 1.3354919360950937e-05, "loss": 1.394, "step": 14990 }, { "epoch": 0.41, "learning_rate": 1.33540861039483e-05, "loss": 1.3088, "step": 14991 }, { "epoch": 0.41, "learning_rate": 1.3353252820704871e-05, "loss": 1.1973, "step": 14992 }, { "epoch": 0.41, "learning_rate": 1.335241951122717e-05, "loss": 1.3367, "step": 14993 }, { "epoch": 0.41, "learning_rate": 1.3351586175521713e-05, "loss": 1.3877, "step": 14994 }, { "epoch": 0.41, "learning_rate": 1.3350752813595025e-05, "loss": 1.3972, "step": 14995 }, { "epoch": 0.41, "learning_rate": 1.3349919425453619e-05, "loss": 1.408, "step": 14996 }, { "epoch": 0.41, "learning_rate": 1.3349086011104022e-05, "loss": 1.1926, "step": 14997 }, { "epoch": 0.41, "learning_rate": 1.334825257055275e-05, "loss": 1.3154, "step": 14998 }, { "epoch": 0.41, "learning_rate": 1.3347419103806323e-05, "loss": 1.2734, "step": 14999 }, { "epoch": 0.41, "learning_rate": 1.3346585610871262e-05, "loss": 1.3713, "step": 15000 }, { "epoch": 0.41, "learning_rate": 1.3345752091754092e-05, "loss": 1.2329, "step": 15001 }, { "epoch": 0.41, "learning_rate": 1.3344918546461328e-05, "loss": 1.3057, "step": 15002 }, { "epoch": 0.41, "learning_rate": 1.3344084974999496e-05, "loss": 1.3162, "step": 15003 }, { "epoch": 0.41, "learning_rate": 1.3343251377375115e-05, "loss": 1.1836, "step": 15004 }, { "epoch": 0.41, "learning_rate": 1.3342417753594706e-05, "loss": 1.3579, "step": 15005 }, { "epoch": 0.41, "learning_rate": 1.3341584103664794e-05, "loss": 1.4351, "step": 15006 }, { "epoch": 0.41, "learning_rate": 1.3340750427591897e-05, "loss": 1.3315, "step": 15007 }, { "epoch": 0.41, "learning_rate": 1.3339916725382542e-05, "loss": 1.3921, "step": 15008 }, { "epoch": 0.41, "learning_rate": 1.333908299704325e-05, "loss": 1.4749, "step": 15009 }, { "epoch": 0.41, "learning_rate": 1.333824924258054e-05, "loss": 1.4036, "step": 15010 }, { "epoch": 0.41, "learning_rate": 1.333741546200094e-05, "loss": 1.3391, "step": 15011 }, { "epoch": 0.41, "learning_rate": 1.333658165531097e-05, "loss": 1.4231, "step": 15012 }, { "epoch": 0.41, "learning_rate": 1.3335747822517153e-05, "loss": 1.2134, "step": 15013 }, { "epoch": 0.41, "learning_rate": 1.3334913963626015e-05, "loss": 1.3657, "step": 15014 }, { "epoch": 0.41, "learning_rate": 1.3334080078644079e-05, "loss": 1.3494, "step": 15015 }, { "epoch": 0.41, "learning_rate": 1.3333246167577864e-05, "loss": 1.3396, "step": 15016 }, { "epoch": 0.41, "learning_rate": 1.3332412230433903e-05, "loss": 1.3892, "step": 15017 }, { "epoch": 0.41, "learning_rate": 1.3331578267218715e-05, "loss": 1.1582, "step": 15018 }, { "epoch": 0.41, "learning_rate": 1.3330744277938825e-05, "loss": 1.3547, "step": 15019 }, { "epoch": 0.41, "learning_rate": 1.3329910262600756e-05, "loss": 1.3408, "step": 15020 }, { "epoch": 0.41, "learning_rate": 1.3329076221211035e-05, "loss": 1.2583, "step": 15021 }, { "epoch": 0.41, "learning_rate": 1.332824215377619e-05, "loss": 1.2375, "step": 15022 }, { "epoch": 0.41, "learning_rate": 1.332740806030274e-05, "loss": 1.2913, "step": 15023 }, { "epoch": 0.41, "learning_rate": 1.3326573940797218e-05, "loss": 1.2678, "step": 15024 }, { "epoch": 0.41, "learning_rate": 1.3325739795266141e-05, "loss": 1.2292, "step": 15025 }, { "epoch": 0.41, "learning_rate": 1.3324905623716045e-05, "loss": 1.3613, "step": 15026 }, { "epoch": 0.41, "learning_rate": 1.3324071426153447e-05, "loss": 1.0378, "step": 15027 }, { "epoch": 0.41, "learning_rate": 1.332323720258488e-05, "loss": 1.3782, "step": 15028 }, { "epoch": 0.41, "learning_rate": 1.3322402953016864e-05, "loss": 1.4937, "step": 15029 }, { "epoch": 0.41, "learning_rate": 1.3321568677455934e-05, "loss": 1.3691, "step": 15030 }, { "epoch": 0.41, "learning_rate": 1.3320734375908608e-05, "loss": 1.3428, "step": 15031 }, { "epoch": 0.41, "learning_rate": 1.3319900048381422e-05, "loss": 1.3577, "step": 15032 }, { "epoch": 0.41, "learning_rate": 1.3319065694880897e-05, "loss": 1.2625, "step": 15033 }, { "epoch": 0.41, "learning_rate": 1.3318231315413566e-05, "loss": 1.3142, "step": 15034 }, { "epoch": 0.41, "learning_rate": 1.3317396909985947e-05, "loss": 1.353, "step": 15035 }, { "epoch": 0.41, "learning_rate": 1.3316562478604578e-05, "loss": 1.2053, "step": 15036 }, { "epoch": 0.41, "learning_rate": 1.3315728021275984e-05, "loss": 1.3967, "step": 15037 }, { "epoch": 0.41, "learning_rate": 1.3314893538006694e-05, "loss": 1.312, "step": 15038 }, { "epoch": 0.41, "learning_rate": 1.3314059028803233e-05, "loss": 1.3574, "step": 15039 }, { "epoch": 0.41, "learning_rate": 1.3313224493672137e-05, "loss": 1.4043, "step": 15040 }, { "epoch": 0.41, "learning_rate": 1.3312389932619927e-05, "loss": 1.2917, "step": 15041 }, { "epoch": 0.41, "learning_rate": 1.3311555345653138e-05, "loss": 1.3562, "step": 15042 }, { "epoch": 0.41, "learning_rate": 1.3310720732778295e-05, "loss": 1.1953, "step": 15043 }, { "epoch": 0.41, "learning_rate": 1.3309886094001932e-05, "loss": 1.344, "step": 15044 }, { "epoch": 0.41, "learning_rate": 1.3309051429330572e-05, "loss": 1.343, "step": 15045 }, { "epoch": 0.41, "learning_rate": 1.3308216738770754e-05, "loss": 1.1921, "step": 15046 }, { "epoch": 0.41, "learning_rate": 1.3307382022329003e-05, "loss": 1.4302, "step": 15047 }, { "epoch": 0.41, "learning_rate": 1.330654728001185e-05, "loss": 1.4307, "step": 15048 }, { "epoch": 0.41, "learning_rate": 1.3305712511825826e-05, "loss": 1.188, "step": 15049 }, { "epoch": 0.41, "learning_rate": 1.3304877717777462e-05, "loss": 1.3601, "step": 15050 }, { "epoch": 0.41, "learning_rate": 1.3304042897873286e-05, "loss": 1.3726, "step": 15051 }, { "epoch": 0.41, "learning_rate": 1.3303208052119836e-05, "loss": 1.7192, "step": 15052 }, { "epoch": 0.41, "learning_rate": 1.3302373180523635e-05, "loss": 1.282, "step": 15053 }, { "epoch": 0.41, "learning_rate": 1.3301538283091225e-05, "loss": 1.2744, "step": 15054 }, { "epoch": 0.41, "learning_rate": 1.3300703359829128e-05, "loss": 1.4121, "step": 15055 }, { "epoch": 0.41, "learning_rate": 1.3299868410743883e-05, "loss": 1.4102, "step": 15056 }, { "epoch": 0.41, "learning_rate": 1.3299033435842015e-05, "loss": 1.2898, "step": 15057 }, { "epoch": 0.41, "learning_rate": 1.3298198435130065e-05, "loss": 1.3176, "step": 15058 }, { "epoch": 0.41, "learning_rate": 1.3297363408614558e-05, "loss": 1.3784, "step": 15059 }, { "epoch": 0.41, "learning_rate": 1.3296528356302035e-05, "loss": 1.3237, "step": 15060 }, { "epoch": 0.41, "learning_rate": 1.3295693278199018e-05, "loss": 1.4321, "step": 15061 }, { "epoch": 0.41, "learning_rate": 1.329485817431205e-05, "loss": 1.271, "step": 15062 }, { "epoch": 0.41, "learning_rate": 1.3294023044647662e-05, "loss": 1.3799, "step": 15063 }, { "epoch": 0.41, "learning_rate": 1.3293187889212384e-05, "loss": 1.4165, "step": 15064 }, { "epoch": 0.41, "learning_rate": 1.3292352708012754e-05, "loss": 1.2358, "step": 15065 }, { "epoch": 0.41, "learning_rate": 1.3291517501055302e-05, "loss": 1.3206, "step": 15066 }, { "epoch": 0.41, "learning_rate": 1.3290682268346569e-05, "loss": 1.3633, "step": 15067 }, { "epoch": 0.41, "learning_rate": 1.3289847009893082e-05, "loss": 1.1812, "step": 15068 }, { "epoch": 0.41, "learning_rate": 1.3289011725701382e-05, "loss": 1.2556, "step": 15069 }, { "epoch": 0.41, "learning_rate": 1.3288176415777998e-05, "loss": 1.3604, "step": 15070 }, { "epoch": 0.41, "learning_rate": 1.328734108012947e-05, "loss": 1.3691, "step": 15071 }, { "epoch": 0.41, "learning_rate": 1.3286505718762331e-05, "loss": 1.2971, "step": 15072 }, { "epoch": 0.41, "learning_rate": 1.3285670331683118e-05, "loss": 1.2957, "step": 15073 }, { "epoch": 0.41, "learning_rate": 1.3284834918898362e-05, "loss": 1.4585, "step": 15074 }, { "epoch": 0.41, "learning_rate": 1.3283999480414605e-05, "loss": 1.2158, "step": 15075 }, { "epoch": 0.41, "learning_rate": 1.3283164016238377e-05, "loss": 1.3523, "step": 15076 }, { "epoch": 0.41, "learning_rate": 1.3282328526376221e-05, "loss": 1.2146, "step": 15077 }, { "epoch": 0.41, "learning_rate": 1.3281493010834667e-05, "loss": 1.1936, "step": 15078 }, { "epoch": 0.41, "learning_rate": 1.3280657469620257e-05, "loss": 1.1633, "step": 15079 }, { "epoch": 0.41, "learning_rate": 1.3279821902739524e-05, "loss": 1.2388, "step": 15080 }, { "epoch": 0.41, "learning_rate": 1.3278986310199011e-05, "loss": 1.2268, "step": 15081 }, { "epoch": 0.41, "learning_rate": 1.3278150692005243e-05, "loss": 1.2737, "step": 15082 }, { "epoch": 0.41, "learning_rate": 1.3277315048164772e-05, "loss": 1.1868, "step": 15083 }, { "epoch": 0.41, "learning_rate": 1.3276479378684126e-05, "loss": 1.6895, "step": 15084 }, { "epoch": 0.41, "learning_rate": 1.327564368356985e-05, "loss": 1.2783, "step": 15085 }, { "epoch": 0.41, "learning_rate": 1.3274807962828473e-05, "loss": 1.3076, "step": 15086 }, { "epoch": 0.41, "learning_rate": 1.3273972216466544e-05, "loss": 1.2095, "step": 15087 }, { "epoch": 0.41, "learning_rate": 1.327313644449059e-05, "loss": 1.1146, "step": 15088 }, { "epoch": 0.41, "learning_rate": 1.3272300646907161e-05, "loss": 1.356, "step": 15089 }, { "epoch": 0.41, "learning_rate": 1.3271464823722787e-05, "loss": 1.3115, "step": 15090 }, { "epoch": 0.41, "learning_rate": 1.3270628974944014e-05, "loss": 1.2451, "step": 15091 }, { "epoch": 0.41, "learning_rate": 1.3269793100577374e-05, "loss": 1.2205, "step": 15092 }, { "epoch": 0.41, "learning_rate": 1.3268957200629413e-05, "loss": 1.4558, "step": 15093 }, { "epoch": 0.41, "learning_rate": 1.3268121275106664e-05, "loss": 1.3091, "step": 15094 }, { "epoch": 0.41, "learning_rate": 1.3267285324015676e-05, "loss": 1.3303, "step": 15095 }, { "epoch": 0.41, "learning_rate": 1.326644934736298e-05, "loss": 1.4365, "step": 15096 }, { "epoch": 0.41, "learning_rate": 1.3265613345155122e-05, "loss": 1.3096, "step": 15097 }, { "epoch": 0.41, "learning_rate": 1.326477731739864e-05, "loss": 1.4131, "step": 15098 }, { "epoch": 0.41, "learning_rate": 1.3263941264100076e-05, "loss": 1.3521, "step": 15099 }, { "epoch": 0.41, "learning_rate": 1.3263105185265969e-05, "loss": 1.3689, "step": 15100 }, { "epoch": 0.41, "learning_rate": 1.3262269080902865e-05, "loss": 1.2114, "step": 15101 }, { "epoch": 0.41, "learning_rate": 1.32614329510173e-05, "loss": 1.2598, "step": 15102 }, { "epoch": 0.41, "learning_rate": 1.3260596795615817e-05, "loss": 1.3311, "step": 15103 }, { "epoch": 0.41, "learning_rate": 1.3259760614704958e-05, "loss": 1.2412, "step": 15104 }, { "epoch": 0.41, "learning_rate": 1.3258924408291265e-05, "loss": 1.2969, "step": 15105 }, { "epoch": 0.41, "learning_rate": 1.3258088176381279e-05, "loss": 1.2367, "step": 15106 }, { "epoch": 0.41, "learning_rate": 1.3257251918981546e-05, "loss": 1.2151, "step": 15107 }, { "epoch": 0.41, "learning_rate": 1.3256415636098602e-05, "loss": 1.3206, "step": 15108 }, { "epoch": 0.41, "learning_rate": 1.3255579327738997e-05, "loss": 1.3645, "step": 15109 }, { "epoch": 0.41, "learning_rate": 1.3254742993909267e-05, "loss": 1.2966, "step": 15110 }, { "epoch": 0.41, "learning_rate": 1.3253906634615961e-05, "loss": 1.22, "step": 15111 }, { "epoch": 0.41, "learning_rate": 1.3253070249865615e-05, "loss": 1.2349, "step": 15112 }, { "epoch": 0.41, "learning_rate": 1.3252233839664779e-05, "loss": 1.386, "step": 15113 }, { "epoch": 0.41, "learning_rate": 1.3251397404019996e-05, "loss": 1.3015, "step": 15114 }, { "epoch": 0.41, "learning_rate": 1.325056094293781e-05, "loss": 1.3833, "step": 15115 }, { "epoch": 0.41, "learning_rate": 1.3249724456424763e-05, "loss": 1.3896, "step": 15116 }, { "epoch": 0.41, "learning_rate": 1.3248887944487397e-05, "loss": 1.2954, "step": 15117 }, { "epoch": 0.41, "learning_rate": 1.3248051407132263e-05, "loss": 1.2256, "step": 15118 }, { "epoch": 0.41, "learning_rate": 1.3247214844365899e-05, "loss": 1.4631, "step": 15119 }, { "epoch": 0.41, "learning_rate": 1.3246378256194856e-05, "loss": 1.3748, "step": 15120 }, { "epoch": 0.41, "learning_rate": 1.3245541642625675e-05, "loss": 1.251, "step": 15121 }, { "epoch": 0.41, "learning_rate": 1.3244705003664902e-05, "loss": 1.2129, "step": 15122 }, { "epoch": 0.41, "learning_rate": 1.324386833931908e-05, "loss": 1.4189, "step": 15123 }, { "epoch": 0.41, "learning_rate": 1.3243031649594765e-05, "loss": 1.2087, "step": 15124 }, { "epoch": 0.41, "learning_rate": 1.324219493449849e-05, "loss": 1.2053, "step": 15125 }, { "epoch": 0.41, "learning_rate": 1.3241358194036807e-05, "loss": 1.3252, "step": 15126 }, { "epoch": 0.41, "learning_rate": 1.324052142821626e-05, "loss": 1.4451, "step": 15127 }, { "epoch": 0.41, "learning_rate": 1.3239684637043397e-05, "loss": 1.3257, "step": 15128 }, { "epoch": 0.41, "learning_rate": 1.3238847820524768e-05, "loss": 1.1235, "step": 15129 }, { "epoch": 0.41, "learning_rate": 1.3238010978666916e-05, "loss": 1.3477, "step": 15130 }, { "epoch": 0.41, "learning_rate": 1.3237174111476388e-05, "loss": 1.2976, "step": 15131 }, { "epoch": 0.41, "learning_rate": 1.3236337218959733e-05, "loss": 1.2725, "step": 15132 }, { "epoch": 0.41, "learning_rate": 1.3235500301123496e-05, "loss": 1.1301, "step": 15133 }, { "epoch": 0.41, "learning_rate": 1.3234663357974227e-05, "loss": 1.2375, "step": 15134 }, { "epoch": 0.41, "learning_rate": 1.3233826389518472e-05, "loss": 1.342, "step": 15135 }, { "epoch": 0.41, "learning_rate": 1.323298939576278e-05, "loss": 1.7183, "step": 15136 }, { "epoch": 0.41, "learning_rate": 1.32321523767137e-05, "loss": 1.1987, "step": 15137 }, { "epoch": 0.41, "learning_rate": 1.3231315332377781e-05, "loss": 1.3455, "step": 15138 }, { "epoch": 0.41, "learning_rate": 1.3230478262761568e-05, "loss": 1.2529, "step": 15139 }, { "epoch": 0.41, "learning_rate": 1.3229641167871613e-05, "loss": 1.2524, "step": 15140 }, { "epoch": 0.41, "learning_rate": 1.3228804047714462e-05, "loss": 1.4119, "step": 15141 }, { "epoch": 0.41, "learning_rate": 1.3227966902296671e-05, "loss": 1.5344, "step": 15142 }, { "epoch": 0.41, "learning_rate": 1.3227129731624781e-05, "loss": 1.3721, "step": 15143 }, { "epoch": 0.41, "learning_rate": 1.3226292535705348e-05, "loss": 1.3652, "step": 15144 }, { "epoch": 0.41, "learning_rate": 1.3225455314544915e-05, "loss": 1.3665, "step": 15145 }, { "epoch": 0.41, "learning_rate": 1.3224618068150041e-05, "loss": 1.239, "step": 15146 }, { "epoch": 0.41, "learning_rate": 1.322378079652727e-05, "loss": 1.4036, "step": 15147 }, { "epoch": 0.41, "learning_rate": 1.3222943499683156e-05, "loss": 1.3396, "step": 15148 }, { "epoch": 0.41, "learning_rate": 1.3222106177624244e-05, "loss": 1.3025, "step": 15149 }, { "epoch": 0.41, "learning_rate": 1.322126883035709e-05, "loss": 1.394, "step": 15150 }, { "epoch": 0.41, "learning_rate": 1.3220431457888243e-05, "loss": 1.1881, "step": 15151 }, { "epoch": 0.41, "learning_rate": 1.3219594060224258e-05, "loss": 1.3481, "step": 15152 }, { "epoch": 0.41, "learning_rate": 1.3218756637371679e-05, "loss": 1.3396, "step": 15153 }, { "epoch": 0.41, "learning_rate": 1.3217919189337063e-05, "loss": 1.2488, "step": 15154 }, { "epoch": 0.41, "learning_rate": 1.3217081716126959e-05, "loss": 1.2124, "step": 15155 }, { "epoch": 0.41, "learning_rate": 1.3216244217747925e-05, "loss": 1.3679, "step": 15156 }, { "epoch": 0.41, "learning_rate": 1.3215406694206503e-05, "loss": 1.2168, "step": 15157 }, { "epoch": 0.41, "learning_rate": 1.3214569145509253e-05, "loss": 1.25, "step": 15158 }, { "epoch": 0.41, "learning_rate": 1.3213731571662724e-05, "loss": 1.322, "step": 15159 }, { "epoch": 0.41, "learning_rate": 1.3212893972673472e-05, "loss": 1.262, "step": 15160 }, { "epoch": 0.41, "learning_rate": 1.3212056348548049e-05, "loss": 1.175, "step": 15161 }, { "epoch": 0.41, "learning_rate": 1.3211218699293009e-05, "loss": 1.1567, "step": 15162 }, { "epoch": 0.41, "learning_rate": 1.32103810249149e-05, "loss": 1.4578, "step": 15163 }, { "epoch": 0.41, "learning_rate": 1.3209543325420282e-05, "loss": 1.1748, "step": 15164 }, { "epoch": 0.41, "learning_rate": 1.3208705600815706e-05, "loss": 1.2373, "step": 15165 }, { "epoch": 0.41, "learning_rate": 1.3207867851107727e-05, "loss": 1.2898, "step": 15166 }, { "epoch": 0.41, "learning_rate": 1.3207030076302896e-05, "loss": 1.3975, "step": 15167 }, { "epoch": 0.41, "learning_rate": 1.3206192276407773e-05, "loss": 1.2632, "step": 15168 }, { "epoch": 0.41, "learning_rate": 1.3205354451428906e-05, "loss": 1.3184, "step": 15169 }, { "epoch": 0.41, "learning_rate": 1.3204516601372856e-05, "loss": 1.3625, "step": 15170 }, { "epoch": 0.41, "learning_rate": 1.3203678726246171e-05, "loss": 1.23, "step": 15171 }, { "epoch": 0.41, "learning_rate": 1.3202840826055417e-05, "loss": 1.1129, "step": 15172 }, { "epoch": 0.41, "learning_rate": 1.3202002900807136e-05, "loss": 1.2185, "step": 15173 }, { "epoch": 0.41, "learning_rate": 1.3201164950507893e-05, "loss": 1.4321, "step": 15174 }, { "epoch": 0.41, "learning_rate": 1.3200326975164237e-05, "loss": 1.1324, "step": 15175 }, { "epoch": 0.41, "learning_rate": 1.3199488974782731e-05, "loss": 1.3149, "step": 15176 }, { "epoch": 0.41, "learning_rate": 1.3198650949369929e-05, "loss": 1.4617, "step": 15177 }, { "epoch": 0.41, "learning_rate": 1.3197812898932383e-05, "loss": 1.4028, "step": 15178 }, { "epoch": 0.41, "learning_rate": 1.3196974823476654e-05, "loss": 1.3225, "step": 15179 }, { "epoch": 0.41, "learning_rate": 1.3196136723009296e-05, "loss": 1.2205, "step": 15180 }, { "epoch": 0.41, "learning_rate": 1.319529859753687e-05, "loss": 1.501, "step": 15181 }, { "epoch": 0.41, "learning_rate": 1.3194460447065929e-05, "loss": 1.3423, "step": 15182 }, { "epoch": 0.41, "learning_rate": 1.3193622271603031e-05, "loss": 1.1428, "step": 15183 }, { "epoch": 0.41, "learning_rate": 1.3192784071154735e-05, "loss": 1.3469, "step": 15184 }, { "epoch": 0.41, "learning_rate": 1.3191945845727596e-05, "loss": 1.2341, "step": 15185 }, { "epoch": 0.41, "learning_rate": 1.3191107595328175e-05, "loss": 1.4158, "step": 15186 }, { "epoch": 0.41, "learning_rate": 1.319026931996303e-05, "loss": 1.3445, "step": 15187 }, { "epoch": 0.41, "learning_rate": 1.3189431019638717e-05, "loss": 1.2175, "step": 15188 }, { "epoch": 0.41, "learning_rate": 1.3188592694361795e-05, "loss": 1.2571, "step": 15189 }, { "epoch": 0.41, "learning_rate": 1.3187754344138819e-05, "loss": 1.3564, "step": 15190 }, { "epoch": 0.41, "learning_rate": 1.3186915968976357e-05, "loss": 1.395, "step": 15191 }, { "epoch": 0.41, "learning_rate": 1.3186077568880962e-05, "loss": 1.238, "step": 15192 }, { "epoch": 0.41, "learning_rate": 1.3185239143859197e-05, "loss": 1.2983, "step": 15193 }, { "epoch": 0.41, "learning_rate": 1.3184400693917614e-05, "loss": 1.2646, "step": 15194 }, { "epoch": 0.41, "learning_rate": 1.318356221906278e-05, "loss": 1.3157, "step": 15195 }, { "epoch": 0.41, "learning_rate": 1.318272371930125e-05, "loss": 1.2495, "step": 15196 }, { "epoch": 0.42, "learning_rate": 1.3181885194639591e-05, "loss": 1.1814, "step": 15197 }, { "epoch": 0.42, "learning_rate": 1.3181046645084354e-05, "loss": 1.4307, "step": 15198 }, { "epoch": 0.42, "learning_rate": 1.3180208070642109e-05, "loss": 1.2429, "step": 15199 }, { "epoch": 0.42, "learning_rate": 1.3179369471319405e-05, "loss": 1.2266, "step": 15200 }, { "epoch": 0.42, "learning_rate": 1.3178530847122815e-05, "loss": 1.4248, "step": 15201 }, { "epoch": 0.42, "learning_rate": 1.3177692198058889e-05, "loss": 1.1948, "step": 15202 }, { "epoch": 0.42, "learning_rate": 1.3176853524134198e-05, "loss": 1.2732, "step": 15203 }, { "epoch": 0.42, "learning_rate": 1.3176014825355296e-05, "loss": 1.3745, "step": 15204 }, { "epoch": 0.42, "learning_rate": 1.317517610172875e-05, "loss": 1.3269, "step": 15205 }, { "epoch": 0.42, "learning_rate": 1.3174337353261115e-05, "loss": 1.3652, "step": 15206 }, { "epoch": 0.42, "learning_rate": 1.317349857995896e-05, "loss": 1.377, "step": 15207 }, { "epoch": 0.42, "learning_rate": 1.3172659781828842e-05, "loss": 1.3052, "step": 15208 }, { "epoch": 0.42, "learning_rate": 1.317182095887733e-05, "loss": 1.4263, "step": 15209 }, { "epoch": 0.42, "learning_rate": 1.3170982111110979e-05, "loss": 1.1902, "step": 15210 }, { "epoch": 0.42, "learning_rate": 1.3170143238536359e-05, "loss": 1.2065, "step": 15211 }, { "epoch": 0.42, "learning_rate": 1.3169304341160025e-05, "loss": 1.3865, "step": 15212 }, { "epoch": 0.42, "learning_rate": 1.3168465418988548e-05, "loss": 1.4436, "step": 15213 }, { "epoch": 0.42, "learning_rate": 1.3167626472028483e-05, "loss": 1.4167, "step": 15214 }, { "epoch": 0.42, "learning_rate": 1.3166787500286402e-05, "loss": 1.3057, "step": 15215 }, { "epoch": 0.42, "learning_rate": 1.3165948503768861e-05, "loss": 1.3994, "step": 15216 }, { "epoch": 0.42, "learning_rate": 1.316510948248243e-05, "loss": 1.3328, "step": 15217 }, { "epoch": 0.42, "learning_rate": 1.3164270436433668e-05, "loss": 1.3044, "step": 15218 }, { "epoch": 0.42, "learning_rate": 1.3163431365629147e-05, "loss": 1.2935, "step": 15219 }, { "epoch": 0.42, "learning_rate": 1.3162592270075423e-05, "loss": 1.2561, "step": 15220 }, { "epoch": 0.42, "learning_rate": 1.3161753149779064e-05, "loss": 1.238, "step": 15221 }, { "epoch": 0.42, "learning_rate": 1.3160914004746637e-05, "loss": 1.3667, "step": 15222 }, { "epoch": 0.42, "learning_rate": 1.3160074834984703e-05, "loss": 1.3435, "step": 15223 }, { "epoch": 0.42, "learning_rate": 1.3159235640499831e-05, "loss": 1.2913, "step": 15224 }, { "epoch": 0.42, "learning_rate": 1.3158396421298586e-05, "loss": 1.1633, "step": 15225 }, { "epoch": 0.42, "learning_rate": 1.3157557177387532e-05, "loss": 1.3613, "step": 15226 }, { "epoch": 0.42, "learning_rate": 1.3156717908773233e-05, "loss": 1.374, "step": 15227 }, { "epoch": 0.42, "learning_rate": 1.3155878615462261e-05, "loss": 1.1829, "step": 15228 }, { "epoch": 0.42, "learning_rate": 1.3155039297461176e-05, "loss": 1.2078, "step": 15229 }, { "epoch": 0.42, "learning_rate": 1.315419995477655e-05, "loss": 1.2168, "step": 15230 }, { "epoch": 0.42, "learning_rate": 1.3153360587414942e-05, "loss": 1.4927, "step": 15231 }, { "epoch": 0.42, "learning_rate": 1.3152521195382927e-05, "loss": 1.3169, "step": 15232 }, { "epoch": 0.42, "learning_rate": 1.315168177868707e-05, "loss": 1.7549, "step": 15233 }, { "epoch": 0.42, "learning_rate": 1.3150842337333934e-05, "loss": 1.4114, "step": 15234 }, { "epoch": 0.42, "learning_rate": 1.3150002871330089e-05, "loss": 1.1746, "step": 15235 }, { "epoch": 0.42, "learning_rate": 1.3149163380682105e-05, "loss": 1.3188, "step": 15236 }, { "epoch": 0.42, "learning_rate": 1.3148323865396544e-05, "loss": 1.2898, "step": 15237 }, { "epoch": 0.42, "learning_rate": 1.314748432547998e-05, "loss": 1.2571, "step": 15238 }, { "epoch": 0.42, "learning_rate": 1.3146644760938978e-05, "loss": 1.4087, "step": 15239 }, { "epoch": 0.42, "learning_rate": 1.3145805171780109e-05, "loss": 1.3345, "step": 15240 }, { "epoch": 0.42, "learning_rate": 1.3144965558009937e-05, "loss": 1.2877, "step": 15241 }, { "epoch": 0.42, "learning_rate": 1.3144125919635036e-05, "loss": 1.272, "step": 15242 }, { "epoch": 0.42, "learning_rate": 1.3143286256661969e-05, "loss": 1.418, "step": 15243 }, { "epoch": 0.42, "learning_rate": 1.3142446569097311e-05, "loss": 1.3315, "step": 15244 }, { "epoch": 0.42, "learning_rate": 1.3141606856947627e-05, "loss": 1.3115, "step": 15245 }, { "epoch": 0.42, "learning_rate": 1.314076712021949e-05, "loss": 1.686, "step": 15246 }, { "epoch": 0.42, "learning_rate": 1.3139927358919466e-05, "loss": 1.1631, "step": 15247 }, { "epoch": 0.42, "learning_rate": 1.313908757305413e-05, "loss": 1.3567, "step": 15248 }, { "epoch": 0.42, "learning_rate": 1.3138247762630045e-05, "loss": 1.3267, "step": 15249 }, { "epoch": 0.42, "learning_rate": 1.3137407927653789e-05, "loss": 1.4041, "step": 15250 }, { "epoch": 0.42, "learning_rate": 1.3136568068131925e-05, "loss": 1.3662, "step": 15251 }, { "epoch": 0.42, "learning_rate": 1.3135728184071029e-05, "loss": 1.186, "step": 15252 }, { "epoch": 0.42, "learning_rate": 1.3134888275477668e-05, "loss": 1.3335, "step": 15253 }, { "epoch": 0.42, "learning_rate": 1.3134048342358421e-05, "loss": 1.3411, "step": 15254 }, { "epoch": 0.42, "learning_rate": 1.3133208384719849e-05, "loss": 1.1841, "step": 15255 }, { "epoch": 0.42, "learning_rate": 1.313236840256853e-05, "loss": 1.376, "step": 15256 }, { "epoch": 0.42, "learning_rate": 1.313152839591103e-05, "loss": 1.2375, "step": 15257 }, { "epoch": 0.42, "learning_rate": 1.3130688364753929e-05, "loss": 1.7725, "step": 15258 }, { "epoch": 0.42, "learning_rate": 1.312984830910379e-05, "loss": 1.2959, "step": 15259 }, { "epoch": 0.42, "learning_rate": 1.3129008228967193e-05, "loss": 1.2297, "step": 15260 }, { "epoch": 0.42, "learning_rate": 1.3128168124350706e-05, "loss": 1.335, "step": 15261 }, { "epoch": 0.42, "learning_rate": 1.3127327995260904e-05, "loss": 1.4314, "step": 15262 }, { "epoch": 0.42, "learning_rate": 1.3126487841704356e-05, "loss": 1.3203, "step": 15263 }, { "epoch": 0.42, "learning_rate": 1.3125647663687637e-05, "loss": 1.1973, "step": 15264 }, { "epoch": 0.42, "learning_rate": 1.3124807461217322e-05, "loss": 1.3823, "step": 15265 }, { "epoch": 0.42, "learning_rate": 1.3123967234299984e-05, "loss": 1.2007, "step": 15266 }, { "epoch": 0.42, "learning_rate": 1.3123126982942193e-05, "loss": 1.1748, "step": 15267 }, { "epoch": 0.42, "learning_rate": 1.3122286707150524e-05, "loss": 1.4485, "step": 15268 }, { "epoch": 0.42, "learning_rate": 1.3121446406931555e-05, "loss": 1.3145, "step": 15269 }, { "epoch": 0.42, "learning_rate": 1.3120606082291855e-05, "loss": 1.2371, "step": 15270 }, { "epoch": 0.42, "learning_rate": 1.3119765733238003e-05, "loss": 1.2874, "step": 15271 }, { "epoch": 0.42, "learning_rate": 1.311892535977657e-05, "loss": 1.3894, "step": 15272 }, { "epoch": 0.42, "learning_rate": 1.311808496191413e-05, "loss": 1.3364, "step": 15273 }, { "epoch": 0.42, "learning_rate": 1.311724453965726e-05, "loss": 1.156, "step": 15274 }, { "epoch": 0.42, "learning_rate": 1.3116404093012535e-05, "loss": 1.3196, "step": 15275 }, { "epoch": 0.42, "learning_rate": 1.311556362198653e-05, "loss": 1.3499, "step": 15276 }, { "epoch": 0.42, "learning_rate": 1.3114723126585818e-05, "loss": 1.2905, "step": 15277 }, { "epoch": 0.42, "learning_rate": 1.311388260681698e-05, "loss": 1.373, "step": 15278 }, { "epoch": 0.42, "learning_rate": 1.3113042062686587e-05, "loss": 1.2959, "step": 15279 }, { "epoch": 0.42, "learning_rate": 1.3112201494201218e-05, "loss": 1.2358, "step": 15280 }, { "epoch": 0.42, "learning_rate": 1.3111360901367446e-05, "loss": 1.3308, "step": 15281 }, { "epoch": 0.42, "learning_rate": 1.3110520284191852e-05, "loss": 1.1843, "step": 15282 }, { "epoch": 0.42, "learning_rate": 1.3109679642681007e-05, "loss": 1.1399, "step": 15283 }, { "epoch": 0.42, "learning_rate": 1.3108838976841493e-05, "loss": 1.4692, "step": 15284 }, { "epoch": 0.42, "learning_rate": 1.3107998286679887e-05, "loss": 1.71, "step": 15285 }, { "epoch": 0.42, "learning_rate": 1.310715757220276e-05, "loss": 1.3298, "step": 15286 }, { "epoch": 0.42, "learning_rate": 1.3106316833416695e-05, "loss": 1.3816, "step": 15287 }, { "epoch": 0.42, "learning_rate": 1.3105476070328264e-05, "loss": 1.2837, "step": 15288 }, { "epoch": 0.42, "learning_rate": 1.3104635282944054e-05, "loss": 1.4304, "step": 15289 }, { "epoch": 0.42, "learning_rate": 1.3103794471270634e-05, "loss": 1.3813, "step": 15290 }, { "epoch": 0.42, "learning_rate": 1.3102953635314588e-05, "loss": 1.2957, "step": 15291 }, { "epoch": 0.42, "learning_rate": 1.310211277508249e-05, "loss": 1.5103, "step": 15292 }, { "epoch": 0.42, "learning_rate": 1.310127189058092e-05, "loss": 1.3574, "step": 15293 }, { "epoch": 0.42, "learning_rate": 1.3100430981816458e-05, "loss": 1.2419, "step": 15294 }, { "epoch": 0.42, "learning_rate": 1.3099590048795683e-05, "loss": 1.3269, "step": 15295 }, { "epoch": 0.42, "learning_rate": 1.3098749091525172e-05, "loss": 1.2188, "step": 15296 }, { "epoch": 0.42, "learning_rate": 1.3097908110011506e-05, "loss": 1.3953, "step": 15297 }, { "epoch": 0.42, "learning_rate": 1.309706710426126e-05, "loss": 1.2866, "step": 15298 }, { "epoch": 0.42, "learning_rate": 1.309622607428102e-05, "loss": 1.3735, "step": 15299 }, { "epoch": 0.42, "learning_rate": 1.3095385020077363e-05, "loss": 1.2693, "step": 15300 }, { "epoch": 0.42, "learning_rate": 1.309454394165687e-05, "loss": 1.4258, "step": 15301 }, { "epoch": 0.42, "learning_rate": 1.309370283902612e-05, "loss": 1.2458, "step": 15302 }, { "epoch": 0.42, "learning_rate": 1.3092861712191693e-05, "loss": 1.4097, "step": 15303 }, { "epoch": 0.42, "learning_rate": 1.309202056116017e-05, "loss": 1.3259, "step": 15304 }, { "epoch": 0.42, "learning_rate": 1.3091179385938135e-05, "loss": 1.1521, "step": 15305 }, { "epoch": 0.42, "learning_rate": 1.3090338186532164e-05, "loss": 1.2764, "step": 15306 }, { "epoch": 0.42, "learning_rate": 1.308949696294884e-05, "loss": 1.312, "step": 15307 }, { "epoch": 0.42, "learning_rate": 1.3088655715194745e-05, "loss": 1.189, "step": 15308 }, { "epoch": 0.42, "learning_rate": 1.3087814443276458e-05, "loss": 1.2856, "step": 15309 }, { "epoch": 0.42, "learning_rate": 1.3086973147200565e-05, "loss": 1.2642, "step": 15310 }, { "epoch": 0.42, "learning_rate": 1.3086131826973647e-05, "loss": 1.1931, "step": 15311 }, { "epoch": 0.42, "learning_rate": 1.3085290482602283e-05, "loss": 1.2517, "step": 15312 }, { "epoch": 0.42, "learning_rate": 1.3084449114093056e-05, "loss": 1.3193, "step": 15313 }, { "epoch": 0.42, "learning_rate": 1.308360772145255e-05, "loss": 1.4014, "step": 15314 }, { "epoch": 0.42, "learning_rate": 1.3082766304687346e-05, "loss": 1.2583, "step": 15315 }, { "epoch": 0.42, "learning_rate": 1.308192486380403e-05, "loss": 1.3691, "step": 15316 }, { "epoch": 0.42, "learning_rate": 1.3081083398809184e-05, "loss": 1.3618, "step": 15317 }, { "epoch": 0.42, "learning_rate": 1.3080241909709388e-05, "loss": 1.27, "step": 15318 }, { "epoch": 0.42, "learning_rate": 1.307940039651123e-05, "loss": 1.2234, "step": 15319 }, { "epoch": 0.42, "learning_rate": 1.3078558859221291e-05, "loss": 1.3516, "step": 15320 }, { "epoch": 0.42, "learning_rate": 1.3077717297846156e-05, "loss": 1.0806, "step": 15321 }, { "epoch": 0.42, "learning_rate": 1.3076875712392405e-05, "loss": 1.5088, "step": 15322 }, { "epoch": 0.42, "learning_rate": 1.3076034102866628e-05, "loss": 1.354, "step": 15323 }, { "epoch": 0.42, "learning_rate": 1.3075192469275404e-05, "loss": 1.2612, "step": 15324 }, { "epoch": 0.42, "learning_rate": 1.3074350811625323e-05, "loss": 1.3188, "step": 15325 }, { "epoch": 0.42, "learning_rate": 1.3073509129922966e-05, "loss": 1.3528, "step": 15326 }, { "epoch": 0.42, "learning_rate": 1.3072667424174919e-05, "loss": 1.2583, "step": 15327 }, { "epoch": 0.42, "learning_rate": 1.3071825694387765e-05, "loss": 1.3887, "step": 15328 }, { "epoch": 0.42, "learning_rate": 1.3070983940568094e-05, "loss": 1.4382, "step": 15329 }, { "epoch": 0.42, "learning_rate": 1.3070142162722485e-05, "loss": 1.3188, "step": 15330 }, { "epoch": 0.42, "learning_rate": 1.306930036085753e-05, "loss": 1.3271, "step": 15331 }, { "epoch": 0.42, "learning_rate": 1.3068458534979813e-05, "loss": 1.7207, "step": 15332 }, { "epoch": 0.42, "learning_rate": 1.3067616685095917e-05, "loss": 1.2788, "step": 15333 }, { "epoch": 0.42, "learning_rate": 1.3066774811212433e-05, "loss": 1.3809, "step": 15334 }, { "epoch": 0.42, "learning_rate": 1.3065932913335944e-05, "loss": 1.2776, "step": 15335 }, { "epoch": 0.42, "learning_rate": 1.3065090991473038e-05, "loss": 1.437, "step": 15336 }, { "epoch": 0.42, "learning_rate": 1.30642490456303e-05, "loss": 1.2385, "step": 15337 }, { "epoch": 0.42, "learning_rate": 1.3063407075814321e-05, "loss": 1.2048, "step": 15338 }, { "epoch": 0.42, "learning_rate": 1.3062565082031682e-05, "loss": 1.3208, "step": 15339 }, { "epoch": 0.42, "learning_rate": 1.3061723064288976e-05, "loss": 1.2847, "step": 15340 }, { "epoch": 0.42, "learning_rate": 1.3060881022592788e-05, "loss": 1.2676, "step": 15341 }, { "epoch": 0.42, "learning_rate": 1.3060038956949708e-05, "loss": 1.3936, "step": 15342 }, { "epoch": 0.42, "learning_rate": 1.305919686736632e-05, "loss": 1.3245, "step": 15343 }, { "epoch": 0.42, "learning_rate": 1.3058354753849214e-05, "loss": 1.2144, "step": 15344 }, { "epoch": 0.42, "learning_rate": 1.3057512616404977e-05, "loss": 1.3347, "step": 15345 }, { "epoch": 0.42, "learning_rate": 1.3056670455040204e-05, "loss": 1.3542, "step": 15346 }, { "epoch": 0.42, "learning_rate": 1.3055828269761475e-05, "loss": 1.3862, "step": 15347 }, { "epoch": 0.42, "learning_rate": 1.3054986060575383e-05, "loss": 1.7354, "step": 15348 }, { "epoch": 0.42, "learning_rate": 1.3054143827488516e-05, "loss": 1.2346, "step": 15349 }, { "epoch": 0.42, "learning_rate": 1.3053301570507466e-05, "loss": 1.3149, "step": 15350 }, { "epoch": 0.42, "learning_rate": 1.3052459289638819e-05, "loss": 1.1946, "step": 15351 }, { "epoch": 0.42, "learning_rate": 1.3051616984889168e-05, "loss": 1.3086, "step": 15352 }, { "epoch": 0.42, "learning_rate": 1.3050774656265098e-05, "loss": 1.2161, "step": 15353 }, { "epoch": 0.42, "learning_rate": 1.3049932303773202e-05, "loss": 1.325, "step": 15354 }, { "epoch": 0.42, "learning_rate": 1.304908992742007e-05, "loss": 1.1187, "step": 15355 }, { "epoch": 0.42, "learning_rate": 1.3048247527212294e-05, "loss": 1.333, "step": 15356 }, { "epoch": 0.42, "learning_rate": 1.3047405103156462e-05, "loss": 1.25, "step": 15357 }, { "epoch": 0.42, "learning_rate": 1.3046562655259164e-05, "loss": 1.3367, "step": 15358 }, { "epoch": 0.42, "learning_rate": 1.3045720183526994e-05, "loss": 1.4587, "step": 15359 }, { "epoch": 0.42, "learning_rate": 1.304487768796654e-05, "loss": 1.3022, "step": 15360 }, { "epoch": 0.42, "learning_rate": 1.3044035168584393e-05, "loss": 1.2969, "step": 15361 }, { "epoch": 0.42, "learning_rate": 1.3043192625387148e-05, "loss": 1.2661, "step": 15362 }, { "epoch": 0.42, "learning_rate": 1.3042350058381397e-05, "loss": 1.2773, "step": 15363 }, { "epoch": 0.42, "learning_rate": 1.3041507467573728e-05, "loss": 1.365, "step": 15364 }, { "epoch": 0.42, "learning_rate": 1.3040664852970735e-05, "loss": 1.3989, "step": 15365 }, { "epoch": 0.42, "learning_rate": 1.3039822214579013e-05, "loss": 1.1606, "step": 15366 }, { "epoch": 0.42, "learning_rate": 1.3038979552405146e-05, "loss": 1.2739, "step": 15367 }, { "epoch": 0.42, "learning_rate": 1.3038136866455734e-05, "loss": 1.3247, "step": 15368 }, { "epoch": 0.42, "learning_rate": 1.303729415673737e-05, "loss": 1.1746, "step": 15369 }, { "epoch": 0.42, "learning_rate": 1.3036451423256643e-05, "loss": 1.3406, "step": 15370 }, { "epoch": 0.42, "learning_rate": 1.3035608666020148e-05, "loss": 1.2876, "step": 15371 }, { "epoch": 0.42, "learning_rate": 1.303476588503448e-05, "loss": 1.2148, "step": 15372 }, { "epoch": 0.42, "learning_rate": 1.3033923080306228e-05, "loss": 1.1694, "step": 15373 }, { "epoch": 0.42, "learning_rate": 1.303308025184199e-05, "loss": 1.3562, "step": 15374 }, { "epoch": 0.42, "learning_rate": 1.3032237399648357e-05, "loss": 1.0319, "step": 15375 }, { "epoch": 0.42, "learning_rate": 1.3031394523731924e-05, "loss": 1.1875, "step": 15376 }, { "epoch": 0.42, "learning_rate": 1.3030551624099288e-05, "loss": 1.4531, "step": 15377 }, { "epoch": 0.42, "learning_rate": 1.302970870075704e-05, "loss": 1.3413, "step": 15378 }, { "epoch": 0.42, "learning_rate": 1.3028865753711778e-05, "loss": 1.3782, "step": 15379 }, { "epoch": 0.42, "learning_rate": 1.3028022782970089e-05, "loss": 1.4099, "step": 15380 }, { "epoch": 0.42, "learning_rate": 1.302717978853858e-05, "loss": 1.3511, "step": 15381 }, { "epoch": 0.42, "learning_rate": 1.3026336770423836e-05, "loss": 1.2393, "step": 15382 }, { "epoch": 0.42, "learning_rate": 1.3025493728632456e-05, "loss": 1.2551, "step": 15383 }, { "epoch": 0.42, "learning_rate": 1.3024650663171037e-05, "loss": 1.3643, "step": 15384 }, { "epoch": 0.42, "learning_rate": 1.3023807574046176e-05, "loss": 1.3987, "step": 15385 }, { "epoch": 0.42, "learning_rate": 1.3022964461264462e-05, "loss": 1.333, "step": 15386 }, { "epoch": 0.42, "learning_rate": 1.30221213248325e-05, "loss": 1.2986, "step": 15387 }, { "epoch": 0.42, "learning_rate": 1.3021278164756877e-05, "loss": 1.3867, "step": 15388 }, { "epoch": 0.42, "learning_rate": 1.30204349810442e-05, "loss": 1.3435, "step": 15389 }, { "epoch": 0.42, "learning_rate": 1.3019591773701055e-05, "loss": 1.3455, "step": 15390 }, { "epoch": 0.42, "learning_rate": 1.3018748542734046e-05, "loss": 1.427, "step": 15391 }, { "epoch": 0.42, "learning_rate": 1.3017905288149763e-05, "loss": 1.3372, "step": 15392 }, { "epoch": 0.42, "learning_rate": 1.3017062009954814e-05, "loss": 1.437, "step": 15393 }, { "epoch": 0.42, "learning_rate": 1.3016218708155789e-05, "loss": 1.2773, "step": 15394 }, { "epoch": 0.42, "learning_rate": 1.3015375382759287e-05, "loss": 1.3662, "step": 15395 }, { "epoch": 0.42, "learning_rate": 1.3014532033771908e-05, "loss": 1.2959, "step": 15396 }, { "epoch": 0.42, "learning_rate": 1.3013688661200245e-05, "loss": 1.6372, "step": 15397 }, { "epoch": 0.42, "learning_rate": 1.30128452650509e-05, "loss": 1.25, "step": 15398 }, { "epoch": 0.42, "learning_rate": 1.3012001845330473e-05, "loss": 1.2131, "step": 15399 }, { "epoch": 0.42, "learning_rate": 1.3011158402045556e-05, "loss": 1.2664, "step": 15400 }, { "epoch": 0.42, "learning_rate": 1.3010314935202755e-05, "loss": 1.231, "step": 15401 }, { "epoch": 0.42, "learning_rate": 1.3009471444808661e-05, "loss": 1.3098, "step": 15402 }, { "epoch": 0.42, "learning_rate": 1.3008627930869881e-05, "loss": 1.0796, "step": 15403 }, { "epoch": 0.42, "learning_rate": 1.300778439339301e-05, "loss": 1.4368, "step": 15404 }, { "epoch": 0.42, "learning_rate": 1.300694083238465e-05, "loss": 1.1638, "step": 15405 }, { "epoch": 0.42, "learning_rate": 1.3006097247851394e-05, "loss": 1.2095, "step": 15406 }, { "epoch": 0.42, "learning_rate": 1.3005253639799852e-05, "loss": 1.0593, "step": 15407 }, { "epoch": 0.42, "learning_rate": 1.3004410008236614e-05, "loss": 1.2314, "step": 15408 }, { "epoch": 0.42, "learning_rate": 1.3003566353168289e-05, "loss": 1.3638, "step": 15409 }, { "epoch": 0.42, "learning_rate": 1.300272267460147e-05, "loss": 1.2542, "step": 15410 }, { "epoch": 0.42, "learning_rate": 1.3001878972542764e-05, "loss": 1.2268, "step": 15411 }, { "epoch": 0.42, "learning_rate": 1.3001035246998765e-05, "loss": 1.3584, "step": 15412 }, { "epoch": 0.42, "learning_rate": 1.300019149797608e-05, "loss": 1.323, "step": 15413 }, { "epoch": 0.42, "learning_rate": 1.2999347725481307e-05, "loss": 1.1465, "step": 15414 }, { "epoch": 0.42, "learning_rate": 1.2998503929521048e-05, "loss": 1.1538, "step": 15415 }, { "epoch": 0.42, "learning_rate": 1.2997660110101904e-05, "loss": 1.4348, "step": 15416 }, { "epoch": 0.42, "learning_rate": 1.2996816267230476e-05, "loss": 1.2166, "step": 15417 }, { "epoch": 0.42, "learning_rate": 1.2995972400913368e-05, "loss": 1.3425, "step": 15418 }, { "epoch": 0.42, "learning_rate": 1.299512851115718e-05, "loss": 1.3901, "step": 15419 }, { "epoch": 0.42, "learning_rate": 1.2994284597968516e-05, "loss": 1.2063, "step": 15420 }, { "epoch": 0.42, "learning_rate": 1.2993440661353978e-05, "loss": 1.7476, "step": 15421 }, { "epoch": 0.42, "learning_rate": 1.2992596701320164e-05, "loss": 1.439, "step": 15422 }, { "epoch": 0.42, "learning_rate": 1.2991752717873682e-05, "loss": 1.344, "step": 15423 }, { "epoch": 0.42, "learning_rate": 1.2990908711021138e-05, "loss": 1.2905, "step": 15424 }, { "epoch": 0.42, "learning_rate": 1.2990064680769124e-05, "loss": 1.3101, "step": 15425 }, { "epoch": 0.42, "learning_rate": 1.2989220627124253e-05, "loss": 1.3589, "step": 15426 }, { "epoch": 0.42, "learning_rate": 1.2988376550093127e-05, "loss": 1.3784, "step": 15427 }, { "epoch": 0.42, "learning_rate": 1.2987532449682344e-05, "loss": 1.406, "step": 15428 }, { "epoch": 0.42, "learning_rate": 1.2986688325898518e-05, "loss": 1.238, "step": 15429 }, { "epoch": 0.42, "learning_rate": 1.2985844178748242e-05, "loss": 1.3503, "step": 15430 }, { "epoch": 0.42, "learning_rate": 1.2985000008238129e-05, "loss": 1.2065, "step": 15431 }, { "epoch": 0.42, "learning_rate": 1.2984155814374774e-05, "loss": 1.3347, "step": 15432 }, { "epoch": 0.42, "learning_rate": 1.2983311597164794e-05, "loss": 1.6655, "step": 15433 }, { "epoch": 0.42, "learning_rate": 1.298246735661478e-05, "loss": 1.3218, "step": 15434 }, { "epoch": 0.42, "learning_rate": 1.298162309273135e-05, "loss": 1.3381, "step": 15435 }, { "epoch": 0.42, "learning_rate": 1.2980778805521098e-05, "loss": 1.3582, "step": 15436 }, { "epoch": 0.42, "learning_rate": 1.2979934494990639e-05, "loss": 1.3262, "step": 15437 }, { "epoch": 0.42, "learning_rate": 1.297909016114657e-05, "loss": 1.4106, "step": 15438 }, { "epoch": 0.42, "learning_rate": 1.2978245803995502e-05, "loss": 1.2515, "step": 15439 }, { "epoch": 0.42, "learning_rate": 1.2977401423544041e-05, "loss": 1.3245, "step": 15440 }, { "epoch": 0.42, "learning_rate": 1.2976557019798788e-05, "loss": 1.3779, "step": 15441 }, { "epoch": 0.42, "learning_rate": 1.2975712592766355e-05, "loss": 1.3018, "step": 15442 }, { "epoch": 0.42, "learning_rate": 1.2974868142453343e-05, "loss": 1.3772, "step": 15443 }, { "epoch": 0.42, "learning_rate": 1.2974023668866364e-05, "loss": 1.2903, "step": 15444 }, { "epoch": 0.42, "learning_rate": 1.2973179172012023e-05, "loss": 1.4219, "step": 15445 }, { "epoch": 0.42, "learning_rate": 1.2972334651896925e-05, "loss": 1.3491, "step": 15446 }, { "epoch": 0.42, "learning_rate": 1.2971490108527677e-05, "loss": 1.3401, "step": 15447 }, { "epoch": 0.42, "learning_rate": 1.297064554191089e-05, "loss": 1.2788, "step": 15448 }, { "epoch": 0.42, "learning_rate": 1.2969800952053168e-05, "loss": 1.3486, "step": 15449 }, { "epoch": 0.42, "learning_rate": 1.2968956338961122e-05, "loss": 1.2761, "step": 15450 }, { "epoch": 0.42, "learning_rate": 1.2968111702641355e-05, "loss": 1.3921, "step": 15451 }, { "epoch": 0.42, "learning_rate": 1.296726704310048e-05, "loss": 1.4104, "step": 15452 }, { "epoch": 0.42, "learning_rate": 1.29664223603451e-05, "loss": 1.4521, "step": 15453 }, { "epoch": 0.42, "learning_rate": 1.2965577654381826e-05, "loss": 1.3789, "step": 15454 }, { "epoch": 0.42, "learning_rate": 1.2964732925217269e-05, "loss": 1.2466, "step": 15455 }, { "epoch": 0.42, "learning_rate": 1.2963888172858037e-05, "loss": 1.3491, "step": 15456 }, { "epoch": 0.42, "learning_rate": 1.2963043397310735e-05, "loss": 1.2725, "step": 15457 }, { "epoch": 0.42, "learning_rate": 1.2962198598581977e-05, "loss": 1.3408, "step": 15458 }, { "epoch": 0.42, "learning_rate": 1.2961353776678368e-05, "loss": 1.1653, "step": 15459 }, { "epoch": 0.42, "learning_rate": 1.2960508931606521e-05, "loss": 1.2715, "step": 15460 }, { "epoch": 0.42, "learning_rate": 1.2959664063373044e-05, "loss": 1.2488, "step": 15461 }, { "epoch": 0.42, "learning_rate": 1.2958819171984547e-05, "loss": 1.2754, "step": 15462 }, { "epoch": 0.42, "learning_rate": 1.295797425744764e-05, "loss": 1.4167, "step": 15463 }, { "epoch": 0.42, "learning_rate": 1.2957129319768935e-05, "loss": 1.3855, "step": 15464 }, { "epoch": 0.42, "learning_rate": 1.2956284358955037e-05, "loss": 1.3115, "step": 15465 }, { "epoch": 0.42, "learning_rate": 1.2955439375012566e-05, "loss": 1.2864, "step": 15466 }, { "epoch": 0.42, "learning_rate": 1.295459436794812e-05, "loss": 1.3337, "step": 15467 }, { "epoch": 0.42, "learning_rate": 1.2953749337768321e-05, "loss": 1.3789, "step": 15468 }, { "epoch": 0.42, "learning_rate": 1.2952904284479776e-05, "loss": 1.0936, "step": 15469 }, { "epoch": 0.42, "learning_rate": 1.2952059208089095e-05, "loss": 1.355, "step": 15470 }, { "epoch": 0.42, "learning_rate": 1.2951214108602892e-05, "loss": 1.4065, "step": 15471 }, { "epoch": 0.42, "learning_rate": 1.2950368986027779e-05, "loss": 1.2307, "step": 15472 }, { "epoch": 0.42, "learning_rate": 1.2949523840370364e-05, "loss": 1.3284, "step": 15473 }, { "epoch": 0.42, "learning_rate": 1.2948678671637264e-05, "loss": 1.603, "step": 15474 }, { "epoch": 0.42, "learning_rate": 1.2947833479835086e-05, "loss": 1.3699, "step": 15475 }, { "epoch": 0.42, "learning_rate": 1.2946988264970448e-05, "loss": 1.3091, "step": 15476 }, { "epoch": 0.42, "learning_rate": 1.2946143027049955e-05, "loss": 1.2576, "step": 15477 }, { "epoch": 0.42, "learning_rate": 1.294529776608023e-05, "loss": 1.4956, "step": 15478 }, { "epoch": 0.42, "learning_rate": 1.2944452482067877e-05, "loss": 1.3916, "step": 15479 }, { "epoch": 0.42, "learning_rate": 1.2943607175019514e-05, "loss": 1.292, "step": 15480 }, { "epoch": 0.42, "learning_rate": 1.2942761844941749e-05, "loss": 1.3191, "step": 15481 }, { "epoch": 0.42, "learning_rate": 1.2941916491841205e-05, "loss": 1.2773, "step": 15482 }, { "epoch": 0.42, "learning_rate": 1.2941071115724483e-05, "loss": 1.2261, "step": 15483 }, { "epoch": 0.42, "learning_rate": 1.2940225716598208e-05, "loss": 1.283, "step": 15484 }, { "epoch": 0.42, "learning_rate": 1.2939380294468989e-05, "loss": 1.3169, "step": 15485 }, { "epoch": 0.42, "learning_rate": 1.2938534849343438e-05, "loss": 1.1953, "step": 15486 }, { "epoch": 0.42, "learning_rate": 1.2937689381228176e-05, "loss": 1.1926, "step": 15487 }, { "epoch": 0.42, "learning_rate": 1.2936843890129811e-05, "loss": 1.2634, "step": 15488 }, { "epoch": 0.42, "learning_rate": 1.2935998376054962e-05, "loss": 1.4819, "step": 15489 }, { "epoch": 0.42, "learning_rate": 1.293515283901024e-05, "loss": 1.3159, "step": 15490 }, { "epoch": 0.42, "learning_rate": 1.2934307279002266e-05, "loss": 1.2358, "step": 15491 }, { "epoch": 0.42, "learning_rate": 1.293346169603765e-05, "loss": 1.3789, "step": 15492 }, { "epoch": 0.42, "learning_rate": 1.2932616090123009e-05, "loss": 1.2683, "step": 15493 }, { "epoch": 0.42, "learning_rate": 1.293177046126496e-05, "loss": 1.2949, "step": 15494 }, { "epoch": 0.42, "learning_rate": 1.2930924809470115e-05, "loss": 1.4021, "step": 15495 }, { "epoch": 0.42, "learning_rate": 1.2930079134745093e-05, "loss": 1.2035, "step": 15496 }, { "epoch": 0.42, "learning_rate": 1.292923343709651e-05, "loss": 1.2629, "step": 15497 }, { "epoch": 0.42, "learning_rate": 1.2928387716530982e-05, "loss": 1.3545, "step": 15498 }, { "epoch": 0.42, "learning_rate": 1.2927541973055129e-05, "loss": 1.1978, "step": 15499 }, { "epoch": 0.42, "learning_rate": 1.2926696206675558e-05, "loss": 1.3789, "step": 15500 }, { "epoch": 0.42, "learning_rate": 1.2925850417398896e-05, "loss": 1.1685, "step": 15501 }, { "epoch": 0.42, "learning_rate": 1.2925004605231753e-05, "loss": 1.1066, "step": 15502 }, { "epoch": 0.42, "learning_rate": 1.2924158770180753e-05, "loss": 1.3896, "step": 15503 }, { "epoch": 0.42, "learning_rate": 1.2923312912252509e-05, "loss": 1.3254, "step": 15504 }, { "epoch": 0.42, "learning_rate": 1.2922467031453639e-05, "loss": 1.136, "step": 15505 }, { "epoch": 0.42, "learning_rate": 1.292162112779076e-05, "loss": 1.3032, "step": 15506 }, { "epoch": 0.42, "learning_rate": 1.2920775201270495e-05, "loss": 1.1958, "step": 15507 }, { "epoch": 0.42, "learning_rate": 1.2919929251899453e-05, "loss": 1.3477, "step": 15508 }, { "epoch": 0.42, "learning_rate": 1.2919083279684262e-05, "loss": 1.4102, "step": 15509 }, { "epoch": 0.42, "learning_rate": 1.2918237284631535e-05, "loss": 1.3677, "step": 15510 }, { "epoch": 0.42, "learning_rate": 1.291739126674789e-05, "loss": 1.3726, "step": 15511 }, { "epoch": 0.42, "learning_rate": 1.2916545226039946e-05, "loss": 1.2473, "step": 15512 }, { "epoch": 0.42, "learning_rate": 1.2915699162514328e-05, "loss": 1.2969, "step": 15513 }, { "epoch": 0.42, "learning_rate": 1.291485307617765e-05, "loss": 1.2163, "step": 15514 }, { "epoch": 0.42, "learning_rate": 1.291400696703653e-05, "loss": 1.3418, "step": 15515 }, { "epoch": 0.42, "learning_rate": 1.2913160835097588e-05, "loss": 1.3833, "step": 15516 }, { "epoch": 0.42, "learning_rate": 1.291231468036745e-05, "loss": 1.3765, "step": 15517 }, { "epoch": 0.42, "learning_rate": 1.291146850285273e-05, "loss": 1.3445, "step": 15518 }, { "epoch": 0.42, "learning_rate": 1.291062230256005e-05, "loss": 1.3147, "step": 15519 }, { "epoch": 0.42, "learning_rate": 1.2909776079496028e-05, "loss": 1.3594, "step": 15520 }, { "epoch": 0.42, "learning_rate": 1.2908929833667288e-05, "loss": 1.3274, "step": 15521 }, { "epoch": 0.42, "learning_rate": 1.2908083565080448e-05, "loss": 1.3052, "step": 15522 }, { "epoch": 0.42, "learning_rate": 1.2907237273742131e-05, "loss": 1.2334, "step": 15523 }, { "epoch": 0.42, "learning_rate": 1.2906390959658954e-05, "loss": 1.4204, "step": 15524 }, { "epoch": 0.42, "learning_rate": 1.2905544622837542e-05, "loss": 1.219, "step": 15525 }, { "epoch": 0.42, "learning_rate": 1.2904698263284516e-05, "loss": 1.384, "step": 15526 }, { "epoch": 0.42, "learning_rate": 1.2903851881006496e-05, "loss": 1.4031, "step": 15527 }, { "epoch": 0.42, "learning_rate": 1.2903005476010104e-05, "loss": 1.4309, "step": 15528 }, { "epoch": 0.42, "learning_rate": 1.2902159048301965e-05, "loss": 1.3689, "step": 15529 }, { "epoch": 0.42, "learning_rate": 1.2901312597888693e-05, "loss": 1.2144, "step": 15530 }, { "epoch": 0.42, "learning_rate": 1.290046612477692e-05, "loss": 1.2239, "step": 15531 }, { "epoch": 0.42, "learning_rate": 1.2899619628973263e-05, "loss": 1.5811, "step": 15532 }, { "epoch": 0.42, "learning_rate": 1.2898773110484344e-05, "loss": 1.3306, "step": 15533 }, { "epoch": 0.42, "learning_rate": 1.289792656931679e-05, "loss": 1.2371, "step": 15534 }, { "epoch": 0.42, "learning_rate": 1.2897080005477217e-05, "loss": 1.3994, "step": 15535 }, { "epoch": 0.42, "learning_rate": 1.2896233418972258e-05, "loss": 1.324, "step": 15536 }, { "epoch": 0.42, "learning_rate": 1.2895386809808526e-05, "loss": 1.197, "step": 15537 }, { "epoch": 0.42, "learning_rate": 1.2894540177992652e-05, "loss": 1.1086, "step": 15538 }, { "epoch": 0.42, "learning_rate": 1.2893693523531252e-05, "loss": 1.1797, "step": 15539 }, { "epoch": 0.42, "learning_rate": 1.289284684643096e-05, "loss": 1.1997, "step": 15540 }, { "epoch": 0.42, "learning_rate": 1.2892000146698391e-05, "loss": 1.4104, "step": 15541 }, { "epoch": 0.42, "learning_rate": 1.2891153424340175e-05, "loss": 1.3208, "step": 15542 }, { "epoch": 0.42, "learning_rate": 1.2890306679362934e-05, "loss": 1.3237, "step": 15543 }, { "epoch": 0.42, "learning_rate": 1.2889459911773292e-05, "loss": 1.3364, "step": 15544 }, { "epoch": 0.42, "learning_rate": 1.2888613121577876e-05, "loss": 1.3855, "step": 15545 }, { "epoch": 0.42, "learning_rate": 1.2887766308783305e-05, "loss": 1.4692, "step": 15546 }, { "epoch": 0.42, "learning_rate": 1.2886919473396212e-05, "loss": 1.1741, "step": 15547 }, { "epoch": 0.42, "learning_rate": 1.2886072615423218e-05, "loss": 1.3303, "step": 15548 }, { "epoch": 0.42, "learning_rate": 1.2885225734870948e-05, "loss": 1.3535, "step": 15549 }, { "epoch": 0.42, "learning_rate": 1.288437883174603e-05, "loss": 1.3679, "step": 15550 }, { "epoch": 0.42, "learning_rate": 1.2883531906055087e-05, "loss": 1.2964, "step": 15551 }, { "epoch": 0.42, "learning_rate": 1.2882684957804746e-05, "loss": 1.3596, "step": 15552 }, { "epoch": 0.42, "learning_rate": 1.2881837987001634e-05, "loss": 1.3586, "step": 15553 }, { "epoch": 0.42, "learning_rate": 1.2880990993652379e-05, "loss": 1.22, "step": 15554 }, { "epoch": 0.42, "learning_rate": 1.2880143977763602e-05, "loss": 1.29, "step": 15555 }, { "epoch": 0.42, "learning_rate": 1.2879296939341935e-05, "loss": 1.3657, "step": 15556 }, { "epoch": 0.42, "learning_rate": 1.2878449878394e-05, "loss": 1.2927, "step": 15557 }, { "epoch": 0.42, "learning_rate": 1.2877602794926429e-05, "loss": 1.4143, "step": 15558 }, { "epoch": 0.42, "learning_rate": 1.2876755688945846e-05, "loss": 1.2683, "step": 15559 }, { "epoch": 0.42, "learning_rate": 1.287590856045888e-05, "loss": 1.3855, "step": 15560 }, { "epoch": 0.42, "learning_rate": 1.2875061409472156e-05, "loss": 1.3782, "step": 15561 }, { "epoch": 0.42, "learning_rate": 1.2874214235992306e-05, "loss": 1.395, "step": 15562 }, { "epoch": 0.43, "learning_rate": 1.2873367040025953e-05, "loss": 1.2883, "step": 15563 }, { "epoch": 0.43, "learning_rate": 1.2872519821579727e-05, "loss": 1.4419, "step": 15564 }, { "epoch": 0.43, "learning_rate": 1.287167258066026e-05, "loss": 1.7026, "step": 15565 }, { "epoch": 0.43, "learning_rate": 1.2870825317274175e-05, "loss": 1.2439, "step": 15566 }, { "epoch": 0.43, "learning_rate": 1.28699780314281e-05, "loss": 1.2788, "step": 15567 }, { "epoch": 0.43, "learning_rate": 1.2869130723128674e-05, "loss": 1.1882, "step": 15568 }, { "epoch": 0.43, "learning_rate": 1.2868283392382512e-05, "loss": 1.3835, "step": 15569 }, { "epoch": 0.43, "learning_rate": 1.2867436039196253e-05, "loss": 1.2891, "step": 15570 }, { "epoch": 0.43, "learning_rate": 1.2866588663576521e-05, "loss": 1.3625, "step": 15571 }, { "epoch": 0.43, "learning_rate": 1.2865741265529947e-05, "loss": 1.4065, "step": 15572 }, { "epoch": 0.43, "learning_rate": 1.286489384506316e-05, "loss": 1.3411, "step": 15573 }, { "epoch": 0.43, "learning_rate": 1.2864046402182793e-05, "loss": 1.115, "step": 15574 }, { "epoch": 0.43, "learning_rate": 1.286319893689547e-05, "loss": 1.4119, "step": 15575 }, { "epoch": 0.43, "learning_rate": 1.286235144920783e-05, "loss": 1.2832, "step": 15576 }, { "epoch": 0.43, "learning_rate": 1.2861503939126496e-05, "loss": 1.3215, "step": 15577 }, { "epoch": 0.43, "learning_rate": 1.2860656406658099e-05, "loss": 1.2429, "step": 15578 }, { "epoch": 0.43, "learning_rate": 1.2859808851809271e-05, "loss": 1.2332, "step": 15579 }, { "epoch": 0.43, "learning_rate": 1.2858961274586648e-05, "loss": 1.321, "step": 15580 }, { "epoch": 0.43, "learning_rate": 1.2858113674996853e-05, "loss": 1.5005, "step": 15581 }, { "epoch": 0.43, "learning_rate": 1.2857266053046523e-05, "loss": 1.3804, "step": 15582 }, { "epoch": 0.43, "learning_rate": 1.2856418408742283e-05, "loss": 1.3928, "step": 15583 }, { "epoch": 0.43, "learning_rate": 1.2855570742090773e-05, "loss": 1.6323, "step": 15584 }, { "epoch": 0.43, "learning_rate": 1.2854723053098617e-05, "loss": 1.3589, "step": 15585 }, { "epoch": 0.43, "learning_rate": 1.2853875341772453e-05, "loss": 1.1545, "step": 15586 }, { "epoch": 0.43, "learning_rate": 1.2853027608118906e-05, "loss": 1.3962, "step": 15587 }, { "epoch": 0.43, "learning_rate": 1.2852179852144618e-05, "loss": 1.238, "step": 15588 }, { "epoch": 0.43, "learning_rate": 1.285133207385621e-05, "loss": 1.1938, "step": 15589 }, { "epoch": 0.43, "learning_rate": 1.2850484273260326e-05, "loss": 1.3936, "step": 15590 }, { "epoch": 0.43, "learning_rate": 1.284963645036359e-05, "loss": 1.3386, "step": 15591 }, { "epoch": 0.43, "learning_rate": 1.2848788605172642e-05, "loss": 1.1897, "step": 15592 }, { "epoch": 0.43, "learning_rate": 1.284794073769411e-05, "loss": 1.2778, "step": 15593 }, { "epoch": 0.43, "learning_rate": 1.2847092847934627e-05, "loss": 1.2971, "step": 15594 }, { "epoch": 0.43, "learning_rate": 1.284624493590083e-05, "loss": 1.3477, "step": 15595 }, { "epoch": 0.43, "learning_rate": 1.284539700159935e-05, "loss": 1.3967, "step": 15596 }, { "epoch": 0.43, "learning_rate": 1.2844549045036821e-05, "loss": 1.2263, "step": 15597 }, { "epoch": 0.43, "learning_rate": 1.2843701066219879e-05, "loss": 1.3923, "step": 15598 }, { "epoch": 0.43, "learning_rate": 1.2842853065155158e-05, "loss": 1.3701, "step": 15599 }, { "epoch": 0.43, "learning_rate": 1.2842005041849291e-05, "loss": 1.3108, "step": 15600 }, { "epoch": 0.43, "learning_rate": 1.2841156996308914e-05, "loss": 1.2966, "step": 15601 }, { "epoch": 0.43, "learning_rate": 1.284030892854066e-05, "loss": 1.3984, "step": 15602 }, { "epoch": 0.43, "learning_rate": 1.2839460838551163e-05, "loss": 1.3066, "step": 15603 }, { "epoch": 0.43, "learning_rate": 1.283861272634706e-05, "loss": 1.2207, "step": 15604 }, { "epoch": 0.43, "learning_rate": 1.2837764591934986e-05, "loss": 1.2568, "step": 15605 }, { "epoch": 0.43, "learning_rate": 1.2836916435321576e-05, "loss": 1.6318, "step": 15606 }, { "epoch": 0.43, "learning_rate": 1.2836068256513467e-05, "loss": 1.1953, "step": 15607 }, { "epoch": 0.43, "learning_rate": 1.2835220055517294e-05, "loss": 1.2954, "step": 15608 }, { "epoch": 0.43, "learning_rate": 1.283437183233969e-05, "loss": 1.261, "step": 15609 }, { "epoch": 0.43, "learning_rate": 1.2833523586987293e-05, "loss": 1.2874, "step": 15610 }, { "epoch": 0.43, "learning_rate": 1.2832675319466743e-05, "loss": 1.2205, "step": 15611 }, { "epoch": 0.43, "learning_rate": 1.2831827029784672e-05, "loss": 1.4277, "step": 15612 }, { "epoch": 0.43, "learning_rate": 1.283097871794772e-05, "loss": 1.2166, "step": 15613 }, { "epoch": 0.43, "learning_rate": 1.2830130383962518e-05, "loss": 1.1577, "step": 15614 }, { "epoch": 0.43, "learning_rate": 1.282928202783571e-05, "loss": 1.293, "step": 15615 }, { "epoch": 0.43, "learning_rate": 1.2828433649573929e-05, "loss": 1.2769, "step": 15616 }, { "epoch": 0.43, "learning_rate": 1.2827585249183815e-05, "loss": 1.3606, "step": 15617 }, { "epoch": 0.43, "learning_rate": 1.2826736826671997e-05, "loss": 1.2209, "step": 15618 }, { "epoch": 0.43, "learning_rate": 1.2825888382045126e-05, "loss": 1.3147, "step": 15619 }, { "epoch": 0.43, "learning_rate": 1.2825039915309829e-05, "loss": 1.2988, "step": 15620 }, { "epoch": 0.43, "learning_rate": 1.2824191426472751e-05, "loss": 1.3701, "step": 15621 }, { "epoch": 0.43, "learning_rate": 1.2823342915540526e-05, "loss": 1.427, "step": 15622 }, { "epoch": 0.43, "learning_rate": 1.2822494382519794e-05, "loss": 1.2593, "step": 15623 }, { "epoch": 0.43, "learning_rate": 1.2821645827417193e-05, "loss": 1.2605, "step": 15624 }, { "epoch": 0.43, "learning_rate": 1.2820797250239361e-05, "loss": 1.4111, "step": 15625 }, { "epoch": 0.43, "learning_rate": 1.2819948650992937e-05, "loss": 1.241, "step": 15626 }, { "epoch": 0.43, "learning_rate": 1.2819100029684563e-05, "loss": 1.1758, "step": 15627 }, { "epoch": 0.43, "learning_rate": 1.2818251386320875e-05, "loss": 1.24, "step": 15628 }, { "epoch": 0.43, "learning_rate": 1.2817402720908516e-05, "loss": 1.4939, "step": 15629 }, { "epoch": 0.43, "learning_rate": 1.2816554033454118e-05, "loss": 1.3467, "step": 15630 }, { "epoch": 0.43, "learning_rate": 1.281570532396433e-05, "loss": 1.1631, "step": 15631 }, { "epoch": 0.43, "learning_rate": 1.2814856592445785e-05, "loss": 1.2849, "step": 15632 }, { "epoch": 0.43, "learning_rate": 1.281400783890513e-05, "loss": 1.3005, "step": 15633 }, { "epoch": 0.43, "learning_rate": 1.2813159063348995e-05, "loss": 1.3376, "step": 15634 }, { "epoch": 0.43, "learning_rate": 1.2812310265784031e-05, "loss": 1.3621, "step": 15635 }, { "epoch": 0.43, "learning_rate": 1.2811461446216871e-05, "loss": 1.3638, "step": 15636 }, { "epoch": 0.43, "learning_rate": 1.281061260465416e-05, "loss": 1.4141, "step": 15637 }, { "epoch": 0.43, "learning_rate": 1.2809763741102537e-05, "loss": 1.3809, "step": 15638 }, { "epoch": 0.43, "learning_rate": 1.2808914855568644e-05, "loss": 1.3804, "step": 15639 }, { "epoch": 0.43, "learning_rate": 1.280806594805912e-05, "loss": 1.4458, "step": 15640 }, { "epoch": 0.43, "learning_rate": 1.280721701858061e-05, "loss": 1.3506, "step": 15641 }, { "epoch": 0.43, "learning_rate": 1.2806368067139756e-05, "loss": 1.2932, "step": 15642 }, { "epoch": 0.43, "learning_rate": 1.2805519093743194e-05, "loss": 1.2405, "step": 15643 }, { "epoch": 0.43, "learning_rate": 1.2804670098397574e-05, "loss": 1.2295, "step": 15644 }, { "epoch": 0.43, "learning_rate": 1.280382108110953e-05, "loss": 1.363, "step": 15645 }, { "epoch": 0.43, "learning_rate": 1.2802972041885712e-05, "loss": 1.1758, "step": 15646 }, { "epoch": 0.43, "learning_rate": 1.2802122980732757e-05, "loss": 1.4727, "step": 15647 }, { "epoch": 0.43, "learning_rate": 1.2801273897657311e-05, "loss": 1.4111, "step": 15648 }, { "epoch": 0.43, "learning_rate": 1.2800424792666013e-05, "loss": 1.3799, "step": 15649 }, { "epoch": 0.43, "learning_rate": 1.2799575665765511e-05, "loss": 1.2192, "step": 15650 }, { "epoch": 0.43, "learning_rate": 1.2798726516962444e-05, "loss": 1.0728, "step": 15651 }, { "epoch": 0.43, "learning_rate": 1.2797877346263456e-05, "loss": 1.2834, "step": 15652 }, { "epoch": 0.43, "learning_rate": 1.279702815367519e-05, "loss": 1.4331, "step": 15653 }, { "epoch": 0.43, "learning_rate": 1.2796178939204295e-05, "loss": 1.2678, "step": 15654 }, { "epoch": 0.43, "learning_rate": 1.2795329702857408e-05, "loss": 1.2783, "step": 15655 }, { "epoch": 0.43, "learning_rate": 1.2794480444641175e-05, "loss": 1.2153, "step": 15656 }, { "epoch": 0.43, "learning_rate": 1.279363116456224e-05, "loss": 1.3254, "step": 15657 }, { "epoch": 0.43, "learning_rate": 1.2792781862627254e-05, "loss": 1.1379, "step": 15658 }, { "epoch": 0.43, "learning_rate": 1.2791932538842853e-05, "loss": 1.4067, "step": 15659 }, { "epoch": 0.43, "learning_rate": 1.2791083193215685e-05, "loss": 1.1931, "step": 15660 }, { "epoch": 0.43, "learning_rate": 1.2790233825752392e-05, "loss": 1.2122, "step": 15661 }, { "epoch": 0.43, "learning_rate": 1.2789384436459626e-05, "loss": 1.2258, "step": 15662 }, { "epoch": 0.43, "learning_rate": 1.2788535025344024e-05, "loss": 1.4434, "step": 15663 }, { "epoch": 0.43, "learning_rate": 1.2787685592412238e-05, "loss": 1.3123, "step": 15664 }, { "epoch": 0.43, "learning_rate": 1.278683613767091e-05, "loss": 1.3184, "step": 15665 }, { "epoch": 0.43, "learning_rate": 1.2785986661126685e-05, "loss": 1.3518, "step": 15666 }, { "epoch": 0.43, "learning_rate": 1.2785137162786212e-05, "loss": 1.1025, "step": 15667 }, { "epoch": 0.43, "learning_rate": 1.2784287642656137e-05, "loss": 1.2595, "step": 15668 }, { "epoch": 0.43, "learning_rate": 1.2783438100743101e-05, "loss": 1.3442, "step": 15669 }, { "epoch": 0.43, "learning_rate": 1.2782588537053757e-05, "loss": 1.209, "step": 15670 }, { "epoch": 0.43, "learning_rate": 1.2781738951594744e-05, "loss": 1.291, "step": 15671 }, { "epoch": 0.43, "learning_rate": 1.278088934437272e-05, "loss": 1.3762, "step": 15672 }, { "epoch": 0.43, "learning_rate": 1.2780039715394322e-05, "loss": 1.2717, "step": 15673 }, { "epoch": 0.43, "learning_rate": 1.27791900646662e-05, "loss": 1.3572, "step": 15674 }, { "epoch": 0.43, "learning_rate": 1.2778340392195003e-05, "loss": 1.2065, "step": 15675 }, { "epoch": 0.43, "learning_rate": 1.2777490697987378e-05, "loss": 1.2302, "step": 15676 }, { "epoch": 0.43, "learning_rate": 1.277664098204997e-05, "loss": 1.4104, "step": 15677 }, { "epoch": 0.43, "learning_rate": 1.277579124438943e-05, "loss": 1.3462, "step": 15678 }, { "epoch": 0.43, "learning_rate": 1.2774941485012406e-05, "loss": 1.4146, "step": 15679 }, { "epoch": 0.43, "learning_rate": 1.2774091703925544e-05, "loss": 1.3064, "step": 15680 }, { "epoch": 0.43, "learning_rate": 1.2773241901135492e-05, "loss": 1.3271, "step": 15681 }, { "epoch": 0.43, "learning_rate": 1.2772392076648899e-05, "loss": 1.3223, "step": 15682 }, { "epoch": 0.43, "learning_rate": 1.2771542230472413e-05, "loss": 1.2861, "step": 15683 }, { "epoch": 0.43, "learning_rate": 1.2770692362612686e-05, "loss": 1.2229, "step": 15684 }, { "epoch": 0.43, "learning_rate": 1.2769842473076364e-05, "loss": 1.1814, "step": 15685 }, { "epoch": 0.43, "learning_rate": 1.2768992561870097e-05, "loss": 1.4336, "step": 15686 }, { "epoch": 0.43, "learning_rate": 1.2768142629000535e-05, "loss": 1.3276, "step": 15687 }, { "epoch": 0.43, "learning_rate": 1.2767292674474325e-05, "loss": 1.1519, "step": 15688 }, { "epoch": 0.43, "learning_rate": 1.276644269829812e-05, "loss": 1.3257, "step": 15689 }, { "epoch": 0.43, "learning_rate": 1.2765592700478568e-05, "loss": 1.282, "step": 15690 }, { "epoch": 0.43, "learning_rate": 1.2764742681022318e-05, "loss": 1.2588, "step": 15691 }, { "epoch": 0.43, "learning_rate": 1.2763892639936022e-05, "loss": 1.3665, "step": 15692 }, { "epoch": 0.43, "learning_rate": 1.276304257722633e-05, "loss": 1.261, "step": 15693 }, { "epoch": 0.43, "learning_rate": 1.2762192492899893e-05, "loss": 1.2871, "step": 15694 }, { "epoch": 0.43, "learning_rate": 1.2761342386963357e-05, "loss": 1.7617, "step": 15695 }, { "epoch": 0.43, "learning_rate": 1.2760492259423382e-05, "loss": 1.3518, "step": 15696 }, { "epoch": 0.43, "learning_rate": 1.2759642110286609e-05, "loss": 1.405, "step": 15697 }, { "epoch": 0.43, "learning_rate": 1.2758791939559698e-05, "loss": 1.4541, "step": 15698 }, { "epoch": 0.43, "learning_rate": 1.2757941747249294e-05, "loss": 1.2854, "step": 15699 }, { "epoch": 0.43, "learning_rate": 1.2757091533362051e-05, "loss": 1.209, "step": 15700 }, { "epoch": 0.43, "learning_rate": 1.2756241297904619e-05, "loss": 1.3091, "step": 15701 }, { "epoch": 0.43, "learning_rate": 1.2755391040883651e-05, "loss": 1.2427, "step": 15702 }, { "epoch": 0.43, "learning_rate": 1.2754540762305802e-05, "loss": 1.344, "step": 15703 }, { "epoch": 0.43, "learning_rate": 1.275369046217772e-05, "loss": 1.3462, "step": 15704 }, { "epoch": 0.43, "learning_rate": 1.2752840140506058e-05, "loss": 1.3223, "step": 15705 }, { "epoch": 0.43, "learning_rate": 1.2751989797297469e-05, "loss": 1.282, "step": 15706 }, { "epoch": 0.43, "learning_rate": 1.2751139432558609e-05, "loss": 1.1277, "step": 15707 }, { "epoch": 0.43, "learning_rate": 1.2750289046296123e-05, "loss": 1.1377, "step": 15708 }, { "epoch": 0.43, "learning_rate": 1.274943863851667e-05, "loss": 1.3372, "step": 15709 }, { "epoch": 0.43, "learning_rate": 1.2748588209226905e-05, "loss": 1.4229, "step": 15710 }, { "epoch": 0.43, "learning_rate": 1.2747737758433477e-05, "loss": 1.3445, "step": 15711 }, { "epoch": 0.43, "learning_rate": 1.274688728614304e-05, "loss": 1.4099, "step": 15712 }, { "epoch": 0.43, "learning_rate": 1.2746036792362249e-05, "loss": 1.3198, "step": 15713 }, { "epoch": 0.43, "learning_rate": 1.2745186277097757e-05, "loss": 1.3711, "step": 15714 }, { "epoch": 0.43, "learning_rate": 1.274433574035622e-05, "loss": 1.3564, "step": 15715 }, { "epoch": 0.43, "learning_rate": 1.2743485182144286e-05, "loss": 1.1145, "step": 15716 }, { "epoch": 0.43, "learning_rate": 1.274263460246862e-05, "loss": 1.2913, "step": 15717 }, { "epoch": 0.43, "learning_rate": 1.2741784001335864e-05, "loss": 1.2913, "step": 15718 }, { "epoch": 0.43, "learning_rate": 1.2740933378752685e-05, "loss": 1.1655, "step": 15719 }, { "epoch": 0.43, "learning_rate": 1.2740082734725729e-05, "loss": 1.2517, "step": 15720 }, { "epoch": 0.43, "learning_rate": 1.2739232069261656e-05, "loss": 1.3013, "step": 15721 }, { "epoch": 0.43, "learning_rate": 1.273838138236712e-05, "loss": 1.3379, "step": 15722 }, { "epoch": 0.43, "learning_rate": 1.2737530674048775e-05, "loss": 1.5151, "step": 15723 }, { "epoch": 0.43, "learning_rate": 1.2736679944313276e-05, "loss": 1.4395, "step": 15724 }, { "epoch": 0.43, "learning_rate": 1.273582919316728e-05, "loss": 1.6792, "step": 15725 }, { "epoch": 0.43, "learning_rate": 1.2734978420617443e-05, "loss": 1.342, "step": 15726 }, { "epoch": 0.43, "learning_rate": 1.2734127626670422e-05, "loss": 1.3113, "step": 15727 }, { "epoch": 0.43, "learning_rate": 1.2733276811332873e-05, "loss": 1.3208, "step": 15728 }, { "epoch": 0.43, "learning_rate": 1.2732425974611451e-05, "loss": 1.4995, "step": 15729 }, { "epoch": 0.43, "learning_rate": 1.273157511651281e-05, "loss": 1.302, "step": 15730 }, { "epoch": 0.43, "learning_rate": 1.2730724237043614e-05, "loss": 1.3179, "step": 15731 }, { "epoch": 0.43, "learning_rate": 1.2729873336210512e-05, "loss": 1.1733, "step": 15732 }, { "epoch": 0.43, "learning_rate": 1.2729022414020165e-05, "loss": 1.2241, "step": 15733 }, { "epoch": 0.43, "learning_rate": 1.2728171470479231e-05, "loss": 1.3281, "step": 15734 }, { "epoch": 0.43, "learning_rate": 1.2727320505594367e-05, "loss": 1.3035, "step": 15735 }, { "epoch": 0.43, "learning_rate": 1.2726469519372229e-05, "loss": 1.343, "step": 15736 }, { "epoch": 0.43, "learning_rate": 1.2725618511819477e-05, "loss": 1.4192, "step": 15737 }, { "epoch": 0.43, "learning_rate": 1.2724767482942766e-05, "loss": 1.1365, "step": 15738 }, { "epoch": 0.43, "learning_rate": 1.2723916432748756e-05, "loss": 1.3918, "step": 15739 }, { "epoch": 0.43, "learning_rate": 1.2723065361244105e-05, "loss": 1.3367, "step": 15740 }, { "epoch": 0.43, "learning_rate": 1.2722214268435471e-05, "loss": 1.2527, "step": 15741 }, { "epoch": 0.43, "learning_rate": 1.2721363154329512e-05, "loss": 1.1421, "step": 15742 }, { "epoch": 0.43, "learning_rate": 1.2720512018932886e-05, "loss": 1.2695, "step": 15743 }, { "epoch": 0.43, "learning_rate": 1.2719660862252256e-05, "loss": 1.3794, "step": 15744 }, { "epoch": 0.43, "learning_rate": 1.2718809684294278e-05, "loss": 1.1914, "step": 15745 }, { "epoch": 0.43, "learning_rate": 1.271795848506561e-05, "loss": 1.3855, "step": 15746 }, { "epoch": 0.43, "learning_rate": 1.2717107264572914e-05, "loss": 1.7271, "step": 15747 }, { "epoch": 0.43, "learning_rate": 1.2716256022822849e-05, "loss": 1.2944, "step": 15748 }, { "epoch": 0.43, "learning_rate": 1.271540475982207e-05, "loss": 1.3579, "step": 15749 }, { "epoch": 0.43, "learning_rate": 1.2714553475577246e-05, "loss": 1.3469, "step": 15750 }, { "epoch": 0.43, "learning_rate": 1.271370217009503e-05, "loss": 1.3889, "step": 15751 }, { "epoch": 0.43, "learning_rate": 1.2712850843382086e-05, "loss": 1.3196, "step": 15752 }, { "epoch": 0.43, "learning_rate": 1.2711999495445068e-05, "loss": 1.2996, "step": 15753 }, { "epoch": 0.43, "learning_rate": 1.2711148126290646e-05, "loss": 1.5308, "step": 15754 }, { "epoch": 0.43, "learning_rate": 1.2710296735925476e-05, "loss": 1.2043, "step": 15755 }, { "epoch": 0.43, "learning_rate": 1.2709445324356217e-05, "loss": 1.4248, "step": 15756 }, { "epoch": 0.43, "learning_rate": 1.2708593891589531e-05, "loss": 1.2825, "step": 15757 }, { "epoch": 0.43, "learning_rate": 1.2707742437632083e-05, "loss": 1.219, "step": 15758 }, { "epoch": 0.43, "learning_rate": 1.2706890962490527e-05, "loss": 1.2537, "step": 15759 }, { "epoch": 0.43, "learning_rate": 1.2706039466171533e-05, "loss": 1.2542, "step": 15760 }, { "epoch": 0.43, "learning_rate": 1.2705187948681757e-05, "loss": 1.3132, "step": 15761 }, { "epoch": 0.43, "learning_rate": 1.2704336410027865e-05, "loss": 1.2036, "step": 15762 }, { "epoch": 0.43, "learning_rate": 1.2703484850216511e-05, "loss": 1.6821, "step": 15763 }, { "epoch": 0.43, "learning_rate": 1.2702633269254365e-05, "loss": 1.1807, "step": 15764 }, { "epoch": 0.43, "learning_rate": 1.2701781667148088e-05, "loss": 1.1738, "step": 15765 }, { "epoch": 0.43, "learning_rate": 1.2700930043904345e-05, "loss": 1.2961, "step": 15766 }, { "epoch": 0.43, "learning_rate": 1.270007839952979e-05, "loss": 1.3093, "step": 15767 }, { "epoch": 0.43, "learning_rate": 1.2699226734031096e-05, "loss": 1.3582, "step": 15768 }, { "epoch": 0.43, "learning_rate": 1.2698375047414917e-05, "loss": 1.2832, "step": 15769 }, { "epoch": 0.43, "learning_rate": 1.2697523339687923e-05, "loss": 1.3413, "step": 15770 }, { "epoch": 0.43, "learning_rate": 1.2696671610856774e-05, "loss": 1.3843, "step": 15771 }, { "epoch": 0.43, "learning_rate": 1.2695819860928136e-05, "loss": 1.2878, "step": 15772 }, { "epoch": 0.43, "learning_rate": 1.269496808990867e-05, "loss": 1.3718, "step": 15773 }, { "epoch": 0.43, "learning_rate": 1.269411629780504e-05, "loss": 1.2556, "step": 15774 }, { "epoch": 0.43, "learning_rate": 1.2693264484623913e-05, "loss": 1.3813, "step": 15775 }, { "epoch": 0.43, "learning_rate": 1.269241265037195e-05, "loss": 1.332, "step": 15776 }, { "epoch": 0.43, "learning_rate": 1.2691560795055815e-05, "loss": 1.3247, "step": 15777 }, { "epoch": 0.43, "learning_rate": 1.2690708918682177e-05, "loss": 1.3794, "step": 15778 }, { "epoch": 0.43, "learning_rate": 1.2689857021257694e-05, "loss": 1.2756, "step": 15779 }, { "epoch": 0.43, "learning_rate": 1.2689005102789036e-05, "loss": 1.2986, "step": 15780 }, { "epoch": 0.43, "learning_rate": 1.2688153163282866e-05, "loss": 1.7261, "step": 15781 }, { "epoch": 0.43, "learning_rate": 1.2687301202745853e-05, "loss": 1.2886, "step": 15782 }, { "epoch": 0.43, "learning_rate": 1.2686449221184653e-05, "loss": 1.3882, "step": 15783 }, { "epoch": 0.43, "learning_rate": 1.2685597218605944e-05, "loss": 1.3481, "step": 15784 }, { "epoch": 0.43, "learning_rate": 1.2684745195016382e-05, "loss": 1.3381, "step": 15785 }, { "epoch": 0.43, "learning_rate": 1.2683893150422638e-05, "loss": 1.3428, "step": 15786 }, { "epoch": 0.43, "learning_rate": 1.2683041084831374e-05, "loss": 1.3496, "step": 15787 }, { "epoch": 0.43, "learning_rate": 1.268218899824926e-05, "loss": 1.2749, "step": 15788 }, { "epoch": 0.43, "learning_rate": 1.2681336890682957e-05, "loss": 1.157, "step": 15789 }, { "epoch": 0.43, "learning_rate": 1.268048476213914e-05, "loss": 1.3867, "step": 15790 }, { "epoch": 0.43, "learning_rate": 1.2679632612624466e-05, "loss": 1.3901, "step": 15791 }, { "epoch": 0.43, "learning_rate": 1.2678780442145611e-05, "loss": 1.4253, "step": 15792 }, { "epoch": 0.43, "learning_rate": 1.2677928250709233e-05, "loss": 1.3235, "step": 15793 }, { "epoch": 0.43, "learning_rate": 1.2677076038322007e-05, "loss": 1.4707, "step": 15794 }, { "epoch": 0.43, "learning_rate": 1.2676223804990594e-05, "loss": 1.4048, "step": 15795 }, { "epoch": 0.43, "learning_rate": 1.2675371550721667e-05, "loss": 1.7676, "step": 15796 }, { "epoch": 0.43, "learning_rate": 1.267451927552189e-05, "loss": 1.4609, "step": 15797 }, { "epoch": 0.43, "learning_rate": 1.2673666979397931e-05, "loss": 1.3276, "step": 15798 }, { "epoch": 0.43, "learning_rate": 1.2672814662356461e-05, "loss": 1.3865, "step": 15799 }, { "epoch": 0.43, "learning_rate": 1.2671962324404143e-05, "loss": 1.282, "step": 15800 }, { "epoch": 0.43, "learning_rate": 1.2671109965547652e-05, "loss": 1.2336, "step": 15801 }, { "epoch": 0.43, "learning_rate": 1.2670257585793648e-05, "loss": 1.1816, "step": 15802 }, { "epoch": 0.43, "learning_rate": 1.2669405185148808e-05, "loss": 1.301, "step": 15803 }, { "epoch": 0.43, "learning_rate": 1.2668552763619797e-05, "loss": 1.731, "step": 15804 }, { "epoch": 0.43, "learning_rate": 1.2667700321213282e-05, "loss": 1.2808, "step": 15805 }, { "epoch": 0.43, "learning_rate": 1.2666847857935936e-05, "loss": 1.4192, "step": 15806 }, { "epoch": 0.43, "learning_rate": 1.2665995373794422e-05, "loss": 1.2334, "step": 15807 }, { "epoch": 0.43, "learning_rate": 1.266514286879542e-05, "loss": 1.4622, "step": 15808 }, { "epoch": 0.43, "learning_rate": 1.266429034294559e-05, "loss": 1.3298, "step": 15809 }, { "epoch": 0.43, "learning_rate": 1.2663437796251605e-05, "loss": 1.3191, "step": 15810 }, { "epoch": 0.43, "learning_rate": 1.2662585228720136e-05, "loss": 1.239, "step": 15811 }, { "epoch": 0.43, "learning_rate": 1.266173264035785e-05, "loss": 1.3147, "step": 15812 }, { "epoch": 0.43, "learning_rate": 1.2660880031171425e-05, "loss": 1.4214, "step": 15813 }, { "epoch": 0.43, "learning_rate": 1.266002740116752e-05, "loss": 1.1519, "step": 15814 }, { "epoch": 0.43, "learning_rate": 1.2659174750352816e-05, "loss": 1.3101, "step": 15815 }, { "epoch": 0.43, "learning_rate": 1.2658322078733976e-05, "loss": 1.2825, "step": 15816 }, { "epoch": 0.43, "learning_rate": 1.2657469386317676e-05, "loss": 1.4536, "step": 15817 }, { "epoch": 0.43, "learning_rate": 1.2656616673110585e-05, "loss": 1.183, "step": 15818 }, { "epoch": 0.43, "learning_rate": 1.2655763939119375e-05, "loss": 1.3936, "step": 15819 }, { "epoch": 0.43, "learning_rate": 1.2654911184350714e-05, "loss": 1.3169, "step": 15820 }, { "epoch": 0.43, "learning_rate": 1.2654058408811278e-05, "loss": 1.1484, "step": 15821 }, { "epoch": 0.43, "learning_rate": 1.2653205612507735e-05, "loss": 1.2793, "step": 15822 }, { "epoch": 0.43, "learning_rate": 1.2652352795446763e-05, "loss": 1.4617, "step": 15823 }, { "epoch": 0.43, "learning_rate": 1.2651499957635028e-05, "loss": 1.2759, "step": 15824 }, { "epoch": 0.43, "learning_rate": 1.2650647099079203e-05, "loss": 1.2739, "step": 15825 }, { "epoch": 0.43, "learning_rate": 1.264979421978596e-05, "loss": 1.1716, "step": 15826 }, { "epoch": 0.43, "learning_rate": 1.2648941319761975e-05, "loss": 1.4863, "step": 15827 }, { "epoch": 0.43, "learning_rate": 1.264808839901392e-05, "loss": 1.3472, "step": 15828 }, { "epoch": 0.43, "learning_rate": 1.2647235457548467e-05, "loss": 1.3291, "step": 15829 }, { "epoch": 0.43, "learning_rate": 1.2646382495372287e-05, "loss": 1.3064, "step": 15830 }, { "epoch": 0.43, "learning_rate": 1.2645529512492056e-05, "loss": 1.3845, "step": 15831 }, { "epoch": 0.43, "learning_rate": 1.2644676508914444e-05, "loss": 1.3174, "step": 15832 }, { "epoch": 0.43, "learning_rate": 1.2643823484646129e-05, "loss": 1.4883, "step": 15833 }, { "epoch": 0.43, "learning_rate": 1.264297043969378e-05, "loss": 1.2949, "step": 15834 }, { "epoch": 0.43, "learning_rate": 1.2642117374064077e-05, "loss": 1.292, "step": 15835 }, { "epoch": 0.43, "learning_rate": 1.2641264287763686e-05, "loss": 1.2231, "step": 15836 }, { "epoch": 0.43, "learning_rate": 1.2640411180799288e-05, "loss": 1.2075, "step": 15837 }, { "epoch": 0.43, "learning_rate": 1.2639558053177552e-05, "loss": 1.2917, "step": 15838 }, { "epoch": 0.43, "learning_rate": 1.2638704904905156e-05, "loss": 1.377, "step": 15839 }, { "epoch": 0.43, "learning_rate": 1.2637851735988773e-05, "loss": 1.2595, "step": 15840 }, { "epoch": 0.43, "learning_rate": 1.263699854643508e-05, "loss": 1.167, "step": 15841 }, { "epoch": 0.43, "learning_rate": 1.2636145336250747e-05, "loss": 1.1904, "step": 15842 }, { "epoch": 0.43, "learning_rate": 1.2635292105442457e-05, "loss": 1.1772, "step": 15843 }, { "epoch": 0.43, "learning_rate": 1.2634438854016877e-05, "loss": 1.323, "step": 15844 }, { "epoch": 0.43, "learning_rate": 1.263358558198069e-05, "loss": 1.333, "step": 15845 }, { "epoch": 0.43, "learning_rate": 1.2632732289340564e-05, "loss": 1.3027, "step": 15846 }, { "epoch": 0.43, "learning_rate": 1.263187897610318e-05, "loss": 1.2322, "step": 15847 }, { "epoch": 0.43, "learning_rate": 1.2631025642275212e-05, "loss": 1.3516, "step": 15848 }, { "epoch": 0.43, "learning_rate": 1.263017228786334e-05, "loss": 1.3706, "step": 15849 }, { "epoch": 0.43, "learning_rate": 1.2629318912874233e-05, "loss": 1.4856, "step": 15850 }, { "epoch": 0.43, "learning_rate": 1.2628465517314572e-05, "loss": 1.1372, "step": 15851 }, { "epoch": 0.43, "learning_rate": 1.2627612101191034e-05, "loss": 1.1814, "step": 15852 }, { "epoch": 0.43, "learning_rate": 1.2626758664510294e-05, "loss": 1.2993, "step": 15853 }, { "epoch": 0.43, "learning_rate": 1.2625905207279028e-05, "loss": 1.3665, "step": 15854 }, { "epoch": 0.43, "learning_rate": 1.2625051729503917e-05, "loss": 1.3652, "step": 15855 }, { "epoch": 0.43, "learning_rate": 1.2624198231191634e-05, "loss": 1.3394, "step": 15856 }, { "epoch": 0.43, "learning_rate": 1.2623344712348858e-05, "loss": 1.3389, "step": 15857 }, { "epoch": 0.43, "learning_rate": 1.2622491172982268e-05, "loss": 1.135, "step": 15858 }, { "epoch": 0.43, "learning_rate": 1.2621637613098537e-05, "loss": 1.2397, "step": 15859 }, { "epoch": 0.43, "learning_rate": 1.262078403270435e-05, "loss": 1.3311, "step": 15860 }, { "epoch": 0.43, "learning_rate": 1.2619930431806378e-05, "loss": 1.291, "step": 15861 }, { "epoch": 0.43, "learning_rate": 1.2619076810411303e-05, "loss": 1.3682, "step": 15862 }, { "epoch": 0.43, "learning_rate": 1.2618223168525802e-05, "loss": 1.3491, "step": 15863 }, { "epoch": 0.43, "learning_rate": 1.2617369506156558e-05, "loss": 1.3081, "step": 15864 }, { "epoch": 0.43, "learning_rate": 1.2616515823310242e-05, "loss": 1.4517, "step": 15865 }, { "epoch": 0.43, "learning_rate": 1.261566211999354e-05, "loss": 1.3333, "step": 15866 }, { "epoch": 0.43, "learning_rate": 1.2614808396213122e-05, "loss": 1.3418, "step": 15867 }, { "epoch": 0.43, "learning_rate": 1.2613954651975677e-05, "loss": 1.4033, "step": 15868 }, { "epoch": 0.43, "learning_rate": 1.261310088728788e-05, "loss": 1.4431, "step": 15869 }, { "epoch": 0.43, "learning_rate": 1.261224710215641e-05, "loss": 1.3735, "step": 15870 }, { "epoch": 0.43, "learning_rate": 1.2611393296587945e-05, "loss": 1.324, "step": 15871 }, { "epoch": 0.43, "learning_rate": 1.2610539470589167e-05, "loss": 1.3804, "step": 15872 }, { "epoch": 0.43, "learning_rate": 1.2609685624166754e-05, "loss": 1.2334, "step": 15873 }, { "epoch": 0.43, "learning_rate": 1.2608831757327393e-05, "loss": 1.2646, "step": 15874 }, { "epoch": 0.43, "learning_rate": 1.2607977870077757e-05, "loss": 1.3357, "step": 15875 }, { "epoch": 0.43, "learning_rate": 1.2607123962424528e-05, "loss": 1.3279, "step": 15876 }, { "epoch": 0.43, "learning_rate": 1.2606270034374385e-05, "loss": 1.4124, "step": 15877 }, { "epoch": 0.43, "learning_rate": 1.2605416085934015e-05, "loss": 1.2603, "step": 15878 }, { "epoch": 0.43, "learning_rate": 1.2604562117110093e-05, "loss": 1.3838, "step": 15879 }, { "epoch": 0.43, "learning_rate": 1.2603708127909301e-05, "loss": 1.189, "step": 15880 }, { "epoch": 0.43, "learning_rate": 1.2602854118338321e-05, "loss": 1.2063, "step": 15881 }, { "epoch": 0.43, "learning_rate": 1.2602000088403837e-05, "loss": 1.2969, "step": 15882 }, { "epoch": 0.43, "learning_rate": 1.2601146038112523e-05, "loss": 1.3779, "step": 15883 }, { "epoch": 0.43, "learning_rate": 1.260029196747107e-05, "loss": 1.2122, "step": 15884 }, { "epoch": 0.43, "learning_rate": 1.2599437876486154e-05, "loss": 1.4436, "step": 15885 }, { "epoch": 0.43, "learning_rate": 1.2598583765164458e-05, "loss": 1.3733, "step": 15886 }, { "epoch": 0.43, "learning_rate": 1.2597729633512662e-05, "loss": 1.4836, "step": 15887 }, { "epoch": 0.43, "learning_rate": 1.2596875481537454e-05, "loss": 1.3774, "step": 15888 }, { "epoch": 0.43, "learning_rate": 1.2596021309245512e-05, "loss": 1.2346, "step": 15889 }, { "epoch": 0.43, "learning_rate": 1.259516711664352e-05, "loss": 1.3215, "step": 15890 }, { "epoch": 0.43, "learning_rate": 1.2594312903738164e-05, "loss": 1.4419, "step": 15891 }, { "epoch": 0.43, "learning_rate": 1.259345867053612e-05, "loss": 1.2961, "step": 15892 }, { "epoch": 0.43, "learning_rate": 1.2592604417044076e-05, "loss": 1.3975, "step": 15893 }, { "epoch": 0.43, "learning_rate": 1.2591750143268717e-05, "loss": 1.3765, "step": 15894 }, { "epoch": 0.43, "learning_rate": 1.259089584921672e-05, "loss": 1.4797, "step": 15895 }, { "epoch": 0.43, "learning_rate": 1.2590041534894772e-05, "loss": 1.407, "step": 15896 }, { "epoch": 0.43, "learning_rate": 1.2589187200309559e-05, "loss": 1.3442, "step": 15897 }, { "epoch": 0.43, "learning_rate": 1.2588332845467763e-05, "loss": 1.2568, "step": 15898 }, { "epoch": 0.43, "learning_rate": 1.2587478470376067e-05, "loss": 1.3418, "step": 15899 }, { "epoch": 0.43, "learning_rate": 1.2586624075041156e-05, "loss": 1.157, "step": 15900 }, { "epoch": 0.43, "learning_rate": 1.2585769659469716e-05, "loss": 1.3867, "step": 15901 }, { "epoch": 0.43, "learning_rate": 1.2584915223668428e-05, "loss": 1.2781, "step": 15902 }, { "epoch": 0.43, "learning_rate": 1.2584060767643979e-05, "loss": 1.3674, "step": 15903 }, { "epoch": 0.43, "learning_rate": 1.2583206291403054e-05, "loss": 1.7471, "step": 15904 }, { "epoch": 0.43, "learning_rate": 1.2582351794952338e-05, "loss": 1.501, "step": 15905 }, { "epoch": 0.43, "learning_rate": 1.2581497278298516e-05, "loss": 1.6948, "step": 15906 }, { "epoch": 0.43, "learning_rate": 1.2580642741448274e-05, "loss": 1.2188, "step": 15907 }, { "epoch": 0.43, "learning_rate": 1.2579788184408295e-05, "loss": 1.3911, "step": 15908 }, { "epoch": 0.43, "learning_rate": 1.257893360718527e-05, "loss": 1.3413, "step": 15909 }, { "epoch": 0.43, "learning_rate": 1.2578079009785875e-05, "loss": 1.2617, "step": 15910 }, { "epoch": 0.43, "learning_rate": 1.2577224392216807e-05, "loss": 1.3909, "step": 15911 }, { "epoch": 0.43, "learning_rate": 1.2576369754484742e-05, "loss": 1.3474, "step": 15912 }, { "epoch": 0.43, "learning_rate": 1.2575515096596377e-05, "loss": 1.2073, "step": 15913 }, { "epoch": 0.43, "learning_rate": 1.2574660418558392e-05, "loss": 1.3975, "step": 15914 }, { "epoch": 0.43, "learning_rate": 1.2573805720377475e-05, "loss": 1.4365, "step": 15915 }, { "epoch": 0.43, "learning_rate": 1.257295100206031e-05, "loss": 1.2139, "step": 15916 }, { "epoch": 0.43, "learning_rate": 1.2572096263613589e-05, "loss": 1.3767, "step": 15917 }, { "epoch": 0.43, "learning_rate": 1.2571241505043994e-05, "loss": 1.2852, "step": 15918 }, { "epoch": 0.43, "learning_rate": 1.2570386726358212e-05, "loss": 1.7646, "step": 15919 }, { "epoch": 0.43, "learning_rate": 1.2569531927562936e-05, "loss": 1.2412, "step": 15920 }, { "epoch": 0.43, "learning_rate": 1.2568677108664851e-05, "loss": 1.1616, "step": 15921 }, { "epoch": 0.43, "learning_rate": 1.2567822269670644e-05, "loss": 1.501, "step": 15922 }, { "epoch": 0.43, "learning_rate": 1.2566967410587003e-05, "loss": 1.3064, "step": 15923 }, { "epoch": 0.43, "learning_rate": 1.2566112531420615e-05, "loss": 1.3716, "step": 15924 }, { "epoch": 0.43, "learning_rate": 1.2565257632178172e-05, "loss": 1.0391, "step": 15925 }, { "epoch": 0.43, "learning_rate": 1.2564402712866357e-05, "loss": 1.2598, "step": 15926 }, { "epoch": 0.43, "learning_rate": 1.2563547773491862e-05, "loss": 1.3806, "step": 15927 }, { "epoch": 0.43, "learning_rate": 1.2562692814061372e-05, "loss": 1.3647, "step": 15928 }, { "epoch": 0.44, "learning_rate": 1.2561837834581585e-05, "loss": 1.1816, "step": 15929 }, { "epoch": 0.44, "learning_rate": 1.2560982835059177e-05, "loss": 1.1543, "step": 15930 }, { "epoch": 0.44, "learning_rate": 1.2560127815500847e-05, "loss": 1.7344, "step": 15931 }, { "epoch": 0.44, "learning_rate": 1.2559272775913278e-05, "loss": 1.2864, "step": 15932 }, { "epoch": 0.44, "learning_rate": 1.2558417716303166e-05, "loss": 1.2185, "step": 15933 }, { "epoch": 0.44, "learning_rate": 1.2557562636677195e-05, "loss": 1.321, "step": 15934 }, { "epoch": 0.44, "learning_rate": 1.2556707537042054e-05, "loss": 1.3782, "step": 15935 }, { "epoch": 0.44, "learning_rate": 1.2555852417404438e-05, "loss": 1.4514, "step": 15936 }, { "epoch": 0.44, "learning_rate": 1.2554997277771036e-05, "loss": 1.2451, "step": 15937 }, { "epoch": 0.44, "learning_rate": 1.2554142118148533e-05, "loss": 1.2937, "step": 15938 }, { "epoch": 0.44, "learning_rate": 1.2553286938543624e-05, "loss": 1.27, "step": 15939 }, { "epoch": 0.44, "learning_rate": 1.2552431738963e-05, "loss": 1.3608, "step": 15940 }, { "epoch": 0.44, "learning_rate": 1.2551576519413352e-05, "loss": 1.3765, "step": 15941 }, { "epoch": 0.44, "learning_rate": 1.2550721279901366e-05, "loss": 1.2887, "step": 15942 }, { "epoch": 0.44, "learning_rate": 1.2549866020433738e-05, "loss": 1.356, "step": 15943 }, { "epoch": 0.44, "learning_rate": 1.2549010741017159e-05, "loss": 1.3647, "step": 15944 }, { "epoch": 0.44, "learning_rate": 1.2548155441658313e-05, "loss": 1.155, "step": 15945 }, { "epoch": 0.44, "learning_rate": 1.2547300122363902e-05, "loss": 1.2893, "step": 15946 }, { "epoch": 0.44, "learning_rate": 1.2546444783140613e-05, "loss": 1.3535, "step": 15947 }, { "epoch": 0.44, "learning_rate": 1.2545589423995134e-05, "loss": 1.3735, "step": 15948 }, { "epoch": 0.44, "learning_rate": 1.2544734044934161e-05, "loss": 1.3164, "step": 15949 }, { "epoch": 0.44, "learning_rate": 1.2543878645964387e-05, "loss": 1.4775, "step": 15950 }, { "epoch": 0.44, "learning_rate": 1.25430232270925e-05, "loss": 1.4487, "step": 15951 }, { "epoch": 0.44, "learning_rate": 1.2542167788325198e-05, "loss": 1.27, "step": 15952 }, { "epoch": 0.44, "learning_rate": 1.2541312329669171e-05, "loss": 1.3936, "step": 15953 }, { "epoch": 0.44, "learning_rate": 1.2540456851131109e-05, "loss": 1.3118, "step": 15954 }, { "epoch": 0.44, "learning_rate": 1.253960135271771e-05, "loss": 1.2297, "step": 15955 }, { "epoch": 0.44, "learning_rate": 1.2538745834435659e-05, "loss": 1.1277, "step": 15956 }, { "epoch": 0.44, "learning_rate": 1.2537890296291659e-05, "loss": 1.2983, "step": 15957 }, { "epoch": 0.44, "learning_rate": 1.2537034738292397e-05, "loss": 1.2412, "step": 15958 }, { "epoch": 0.44, "learning_rate": 1.253617916044457e-05, "loss": 1.1548, "step": 15959 }, { "epoch": 0.44, "learning_rate": 1.2535323562754868e-05, "loss": 1.3804, "step": 15960 }, { "epoch": 0.44, "learning_rate": 1.2534467945229988e-05, "loss": 1.3274, "step": 15961 }, { "epoch": 0.44, "learning_rate": 1.2533612307876621e-05, "loss": 1.23, "step": 15962 }, { "epoch": 0.44, "learning_rate": 1.2532756650701465e-05, "loss": 1.2295, "step": 15963 }, { "epoch": 0.44, "learning_rate": 1.2531900973711211e-05, "loss": 1.4302, "step": 15964 }, { "epoch": 0.44, "learning_rate": 1.2531045276912552e-05, "loss": 1.3333, "step": 15965 }, { "epoch": 0.44, "learning_rate": 1.2530189560312187e-05, "loss": 1.3333, "step": 15966 }, { "epoch": 0.44, "learning_rate": 1.2529333823916807e-05, "loss": 1.4185, "step": 15967 }, { "epoch": 0.44, "learning_rate": 1.2528478067733112e-05, "loss": 1.2632, "step": 15968 }, { "epoch": 0.44, "learning_rate": 1.2527622291767792e-05, "loss": 1.3452, "step": 15969 }, { "epoch": 0.44, "learning_rate": 1.2526766496027543e-05, "loss": 1.1982, "step": 15970 }, { "epoch": 0.44, "learning_rate": 1.252591068051906e-05, "loss": 1.4922, "step": 15971 }, { "epoch": 0.44, "learning_rate": 1.2525054845249042e-05, "loss": 1.2983, "step": 15972 }, { "epoch": 0.44, "learning_rate": 1.2524198990224181e-05, "loss": 1.2942, "step": 15973 }, { "epoch": 0.44, "learning_rate": 1.2523343115451177e-05, "loss": 1.3618, "step": 15974 }, { "epoch": 0.44, "learning_rate": 1.2522487220936718e-05, "loss": 1.2446, "step": 15975 }, { "epoch": 0.44, "learning_rate": 1.252163130668751e-05, "loss": 1.1343, "step": 15976 }, { "epoch": 0.44, "learning_rate": 1.2520775372710242e-05, "loss": 1.3394, "step": 15977 }, { "epoch": 0.44, "learning_rate": 1.2519919419011612e-05, "loss": 1.2642, "step": 15978 }, { "epoch": 0.44, "learning_rate": 1.2519063445598317e-05, "loss": 1.2961, "step": 15979 }, { "epoch": 0.44, "learning_rate": 1.2518207452477056e-05, "loss": 1.3357, "step": 15980 }, { "epoch": 0.44, "learning_rate": 1.2517351439654522e-05, "loss": 1.2556, "step": 15981 }, { "epoch": 0.44, "learning_rate": 1.2516495407137415e-05, "loss": 1.4368, "step": 15982 }, { "epoch": 0.44, "learning_rate": 1.2515639354932432e-05, "loss": 1.2927, "step": 15983 }, { "epoch": 0.44, "learning_rate": 1.251478328304627e-05, "loss": 1.3149, "step": 15984 }, { "epoch": 0.44, "learning_rate": 1.2513927191485624e-05, "loss": 1.3162, "step": 15985 }, { "epoch": 0.44, "learning_rate": 1.2513071080257198e-05, "loss": 1.2859, "step": 15986 }, { "epoch": 0.44, "learning_rate": 1.251221494936768e-05, "loss": 1.3247, "step": 15987 }, { "epoch": 0.44, "learning_rate": 1.2511358798823778e-05, "loss": 1.365, "step": 15988 }, { "epoch": 0.44, "learning_rate": 1.2510502628632182e-05, "loss": 1.2014, "step": 15989 }, { "epoch": 0.44, "learning_rate": 1.2509646438799598e-05, "loss": 1.3423, "step": 15990 }, { "epoch": 0.44, "learning_rate": 1.2508790229332718e-05, "loss": 1.1115, "step": 15991 }, { "epoch": 0.44, "learning_rate": 1.2507934000238244e-05, "loss": 1.3826, "step": 15992 }, { "epoch": 0.44, "learning_rate": 1.2507077751522872e-05, "loss": 1.3523, "step": 15993 }, { "epoch": 0.44, "learning_rate": 1.2506221483193306e-05, "loss": 1.3694, "step": 15994 }, { "epoch": 0.44, "learning_rate": 1.2505365195256237e-05, "loss": 1.2708, "step": 15995 }, { "epoch": 0.44, "learning_rate": 1.2504508887718375e-05, "loss": 1.3638, "step": 15996 }, { "epoch": 0.44, "learning_rate": 1.2503652560586404e-05, "loss": 1.3076, "step": 15997 }, { "epoch": 0.44, "learning_rate": 1.250279621386704e-05, "loss": 1.3044, "step": 15998 }, { "epoch": 0.44, "learning_rate": 1.250193984756697e-05, "loss": 1.26, "step": 15999 }, { "epoch": 0.44, "learning_rate": 1.2501083461692904e-05, "loss": 1.248, "step": 16000 }, { "epoch": 0.44, "learning_rate": 1.2500227056251534e-05, "loss": 1.5654, "step": 16001 }, { "epoch": 0.44, "learning_rate": 1.2499370631249568e-05, "loss": 1.2866, "step": 16002 }, { "epoch": 0.44, "learning_rate": 1.2498514186693697e-05, "loss": 1.1948, "step": 16003 }, { "epoch": 0.44, "learning_rate": 1.2497657722590629e-05, "loss": 1.3813, "step": 16004 }, { "epoch": 0.44, "learning_rate": 1.2496801238947059e-05, "loss": 1.14, "step": 16005 }, { "epoch": 0.44, "learning_rate": 1.249594473576969e-05, "loss": 1.2566, "step": 16006 }, { "epoch": 0.44, "learning_rate": 1.2495088213065223e-05, "loss": 1.2261, "step": 16007 }, { "epoch": 0.44, "learning_rate": 1.2494231670840361e-05, "loss": 1.2854, "step": 16008 }, { "epoch": 0.44, "learning_rate": 1.2493375109101802e-05, "loss": 1.3411, "step": 16009 }, { "epoch": 0.44, "learning_rate": 1.249251852785625e-05, "loss": 1.1125, "step": 16010 }, { "epoch": 0.44, "learning_rate": 1.2491661927110401e-05, "loss": 1.303, "step": 16011 }, { "epoch": 0.44, "learning_rate": 1.2490805306870963e-05, "loss": 1.3447, "step": 16012 }, { "epoch": 0.44, "learning_rate": 1.2489948667144639e-05, "loss": 1.1843, "step": 16013 }, { "epoch": 0.44, "learning_rate": 1.2489092007938122e-05, "loss": 1.4346, "step": 16014 }, { "epoch": 0.44, "learning_rate": 1.2488235329258125e-05, "loss": 1.3452, "step": 16015 }, { "epoch": 0.44, "learning_rate": 1.248737863111134e-05, "loss": 1.2927, "step": 16016 }, { "epoch": 0.44, "learning_rate": 1.2486521913504477e-05, "loss": 1.2437, "step": 16017 }, { "epoch": 0.44, "learning_rate": 1.2485665176444235e-05, "loss": 1.3044, "step": 16018 }, { "epoch": 0.44, "learning_rate": 1.2484808419937317e-05, "loss": 1.2219, "step": 16019 }, { "epoch": 0.44, "learning_rate": 1.2483951643990426e-05, "loss": 1.0867, "step": 16020 }, { "epoch": 0.44, "learning_rate": 1.248309484861027e-05, "loss": 1.3003, "step": 16021 }, { "epoch": 0.44, "learning_rate": 1.2482238033803543e-05, "loss": 1.2051, "step": 16022 }, { "epoch": 0.44, "learning_rate": 1.2481381199576955e-05, "loss": 1.3765, "step": 16023 }, { "epoch": 0.44, "learning_rate": 1.2480524345937205e-05, "loss": 1.3091, "step": 16024 }, { "epoch": 0.44, "learning_rate": 1.2479667472891e-05, "loss": 1.3396, "step": 16025 }, { "epoch": 0.44, "learning_rate": 1.247881058044504e-05, "loss": 1.4658, "step": 16026 }, { "epoch": 0.44, "learning_rate": 1.2477953668606038e-05, "loss": 1.2737, "step": 16027 }, { "epoch": 0.44, "learning_rate": 1.2477096737380684e-05, "loss": 1.0895, "step": 16028 }, { "epoch": 0.44, "learning_rate": 1.2476239786775695e-05, "loss": 1.2637, "step": 16029 }, { "epoch": 0.44, "learning_rate": 1.2475382816797767e-05, "loss": 1.3081, "step": 16030 }, { "epoch": 0.44, "learning_rate": 1.2474525827453612e-05, "loss": 1.3687, "step": 16031 }, { "epoch": 0.44, "learning_rate": 1.2473668818749927e-05, "loss": 1.228, "step": 16032 }, { "epoch": 0.44, "learning_rate": 1.2472811790693424e-05, "loss": 1.2446, "step": 16033 }, { "epoch": 0.44, "learning_rate": 1.2471954743290803e-05, "loss": 1.1902, "step": 16034 }, { "epoch": 0.44, "learning_rate": 1.247109767654877e-05, "loss": 1.2273, "step": 16035 }, { "epoch": 0.44, "learning_rate": 1.2470240590474029e-05, "loss": 1.3062, "step": 16036 }, { "epoch": 0.44, "learning_rate": 1.246938348507329e-05, "loss": 1.3369, "step": 16037 }, { "epoch": 0.44, "learning_rate": 1.2468526360353254e-05, "loss": 1.3647, "step": 16038 }, { "epoch": 0.44, "learning_rate": 1.246766921632063e-05, "loss": 1.2339, "step": 16039 }, { "epoch": 0.44, "learning_rate": 1.246681205298212e-05, "loss": 1.3599, "step": 16040 }, { "epoch": 0.44, "learning_rate": 1.2465954870344437e-05, "loss": 1.198, "step": 16041 }, { "epoch": 0.44, "learning_rate": 1.2465097668414279e-05, "loss": 1.2185, "step": 16042 }, { "epoch": 0.44, "learning_rate": 1.2464240447198356e-05, "loss": 1.2942, "step": 16043 }, { "epoch": 0.44, "learning_rate": 1.2463383206703373e-05, "loss": 1.3708, "step": 16044 }, { "epoch": 0.44, "learning_rate": 1.2462525946936041e-05, "loss": 1.3308, "step": 16045 }, { "epoch": 0.44, "learning_rate": 1.2461668667903062e-05, "loss": 1.3689, "step": 16046 }, { "epoch": 0.44, "learning_rate": 1.2460811369611147e-05, "loss": 1.3723, "step": 16047 }, { "epoch": 0.44, "learning_rate": 1.2459954052067e-05, "loss": 1.2566, "step": 16048 }, { "epoch": 0.44, "learning_rate": 1.245909671527733e-05, "loss": 1.1675, "step": 16049 }, { "epoch": 0.44, "learning_rate": 1.2458239359248842e-05, "loss": 1.2935, "step": 16050 }, { "epoch": 0.44, "learning_rate": 1.2457381983988248e-05, "loss": 1.2024, "step": 16051 }, { "epoch": 0.44, "learning_rate": 1.245652458950225e-05, "loss": 1.3208, "step": 16052 }, { "epoch": 0.44, "learning_rate": 1.2455667175797563e-05, "loss": 1.3862, "step": 16053 }, { "epoch": 0.44, "learning_rate": 1.2454809742880886e-05, "loss": 1.2288, "step": 16054 }, { "epoch": 0.44, "learning_rate": 1.2453952290758935e-05, "loss": 1.4709, "step": 16055 }, { "epoch": 0.44, "learning_rate": 1.2453094819438411e-05, "loss": 1.3337, "step": 16056 }, { "epoch": 0.44, "learning_rate": 1.2452237328926033e-05, "loss": 1.2578, "step": 16057 }, { "epoch": 0.44, "learning_rate": 1.2451379819228498e-05, "loss": 1.3093, "step": 16058 }, { "epoch": 0.44, "learning_rate": 1.245052229035252e-05, "loss": 1.2722, "step": 16059 }, { "epoch": 0.44, "learning_rate": 1.2449664742304813e-05, "loss": 1.334, "step": 16060 }, { "epoch": 0.44, "learning_rate": 1.2448807175092075e-05, "loss": 1.1504, "step": 16061 }, { "epoch": 0.44, "learning_rate": 1.2447949588721025e-05, "loss": 1.4292, "step": 16062 }, { "epoch": 0.44, "learning_rate": 1.2447091983198368e-05, "loss": 1.2788, "step": 16063 }, { "epoch": 0.44, "learning_rate": 1.2446234358530813e-05, "loss": 1.1924, "step": 16064 }, { "epoch": 0.44, "learning_rate": 1.244537671472507e-05, "loss": 1.2383, "step": 16065 }, { "epoch": 0.44, "learning_rate": 1.2444519051787853e-05, "loss": 1.2573, "step": 16066 }, { "epoch": 0.44, "learning_rate": 1.2443661369725866e-05, "loss": 1.3296, "step": 16067 }, { "epoch": 0.44, "learning_rate": 1.2442803668545823e-05, "loss": 1.1873, "step": 16068 }, { "epoch": 0.44, "learning_rate": 1.2441945948254428e-05, "loss": 1.3757, "step": 16069 }, { "epoch": 0.44, "learning_rate": 1.2441088208858398e-05, "loss": 1.355, "step": 16070 }, { "epoch": 0.44, "learning_rate": 1.2440230450364445e-05, "loss": 1.4038, "step": 16071 }, { "epoch": 0.44, "learning_rate": 1.2439372672779273e-05, "loss": 1.2676, "step": 16072 }, { "epoch": 0.44, "learning_rate": 1.2438514876109599e-05, "loss": 1.2377, "step": 16073 }, { "epoch": 0.44, "learning_rate": 1.243765706036213e-05, "loss": 1.3301, "step": 16074 }, { "epoch": 0.44, "learning_rate": 1.243679922554358e-05, "loss": 1.387, "step": 16075 }, { "epoch": 0.44, "learning_rate": 1.2435941371660655e-05, "loss": 1.4036, "step": 16076 }, { "epoch": 0.44, "learning_rate": 1.2435083498720073e-05, "loss": 1.2205, "step": 16077 }, { "epoch": 0.44, "learning_rate": 1.2434225606728543e-05, "loss": 1.4067, "step": 16078 }, { "epoch": 0.44, "learning_rate": 1.2433367695692774e-05, "loss": 1.0767, "step": 16079 }, { "epoch": 0.44, "learning_rate": 1.2432509765619484e-05, "loss": 1.3557, "step": 16080 }, { "epoch": 0.44, "learning_rate": 1.243165181651538e-05, "loss": 1.2058, "step": 16081 }, { "epoch": 0.44, "learning_rate": 1.2430793848387177e-05, "loss": 1.3145, "step": 16082 }, { "epoch": 0.44, "learning_rate": 1.2429935861241583e-05, "loss": 1.1609, "step": 16083 }, { "epoch": 0.44, "learning_rate": 1.2429077855085317e-05, "loss": 1.2563, "step": 16084 }, { "epoch": 0.44, "learning_rate": 1.2428219829925083e-05, "loss": 1.3315, "step": 16085 }, { "epoch": 0.44, "learning_rate": 1.2427361785767604e-05, "loss": 1.3323, "step": 16086 }, { "epoch": 0.44, "learning_rate": 1.2426503722619583e-05, "loss": 1.4102, "step": 16087 }, { "epoch": 0.44, "learning_rate": 1.2425645640487742e-05, "loss": 1.2996, "step": 16088 }, { "epoch": 0.44, "learning_rate": 1.2424787539378788e-05, "loss": 1.3457, "step": 16089 }, { "epoch": 0.44, "learning_rate": 1.2423929419299436e-05, "loss": 1.1929, "step": 16090 }, { "epoch": 0.44, "learning_rate": 1.24230712802564e-05, "loss": 1.2629, "step": 16091 }, { "epoch": 0.44, "learning_rate": 1.2422213122256397e-05, "loss": 1.3467, "step": 16092 }, { "epoch": 0.44, "learning_rate": 1.2421354945306132e-05, "loss": 1.4468, "step": 16093 }, { "epoch": 0.44, "learning_rate": 1.242049674941233e-05, "loss": 1.4014, "step": 16094 }, { "epoch": 0.44, "learning_rate": 1.2419638534581698e-05, "loss": 1.3735, "step": 16095 }, { "epoch": 0.44, "learning_rate": 1.2418780300820952e-05, "loss": 1.1802, "step": 16096 }, { "epoch": 0.44, "learning_rate": 1.2417922048136803e-05, "loss": 1.4062, "step": 16097 }, { "epoch": 0.44, "learning_rate": 1.2417063776535973e-05, "loss": 1.4497, "step": 16098 }, { "epoch": 0.44, "learning_rate": 1.2416205486025171e-05, "loss": 1.3687, "step": 16099 }, { "epoch": 0.44, "learning_rate": 1.2415347176611114e-05, "loss": 1.3157, "step": 16100 }, { "epoch": 0.44, "learning_rate": 1.2414488848300517e-05, "loss": 1.1987, "step": 16101 }, { "epoch": 0.44, "learning_rate": 1.2413630501100093e-05, "loss": 1.2559, "step": 16102 }, { "epoch": 0.44, "learning_rate": 1.241277213501656e-05, "loss": 1.1661, "step": 16103 }, { "epoch": 0.44, "learning_rate": 1.2411913750056632e-05, "loss": 1.354, "step": 16104 }, { "epoch": 0.44, "learning_rate": 1.2411055346227024e-05, "loss": 1.4302, "step": 16105 }, { "epoch": 0.44, "learning_rate": 1.2410196923534455e-05, "loss": 1.3228, "step": 16106 }, { "epoch": 0.44, "learning_rate": 1.2409338481985636e-05, "loss": 1.2515, "step": 16107 }, { "epoch": 0.44, "learning_rate": 1.2408480021587285e-05, "loss": 1.1904, "step": 16108 }, { "epoch": 0.44, "learning_rate": 1.2407621542346121e-05, "loss": 1.3572, "step": 16109 }, { "epoch": 0.44, "learning_rate": 1.2406763044268859e-05, "loss": 1.4614, "step": 16110 }, { "epoch": 0.44, "learning_rate": 1.2405904527362213e-05, "loss": 1.3445, "step": 16111 }, { "epoch": 0.44, "learning_rate": 1.2405045991632905e-05, "loss": 1.3923, "step": 16112 }, { "epoch": 0.44, "learning_rate": 1.2404187437087642e-05, "loss": 1.2504, "step": 16113 }, { "epoch": 0.44, "learning_rate": 1.2403328863733152e-05, "loss": 1.4395, "step": 16114 }, { "epoch": 0.44, "learning_rate": 1.2402470271576146e-05, "loss": 1.1648, "step": 16115 }, { "epoch": 0.44, "learning_rate": 1.2401611660623342e-05, "loss": 1.2949, "step": 16116 }, { "epoch": 0.44, "learning_rate": 1.2400753030881456e-05, "loss": 1.2656, "step": 16117 }, { "epoch": 0.44, "learning_rate": 1.239989438235721e-05, "loss": 1.4756, "step": 16118 }, { "epoch": 0.44, "learning_rate": 1.2399035715057316e-05, "loss": 1.3552, "step": 16119 }, { "epoch": 0.44, "learning_rate": 1.2398177028988496e-05, "loss": 1.2576, "step": 16120 }, { "epoch": 0.44, "learning_rate": 1.2397318324157466e-05, "loss": 1.1494, "step": 16121 }, { "epoch": 0.44, "learning_rate": 1.2396459600570944e-05, "loss": 1.3411, "step": 16122 }, { "epoch": 0.44, "learning_rate": 1.2395600858235653e-05, "loss": 1.3752, "step": 16123 }, { "epoch": 0.44, "learning_rate": 1.2394742097158303e-05, "loss": 1.3389, "step": 16124 }, { "epoch": 0.44, "learning_rate": 1.239388331734562e-05, "loss": 1.3271, "step": 16125 }, { "epoch": 0.44, "learning_rate": 1.2393024518804318e-05, "loss": 1.2998, "step": 16126 }, { "epoch": 0.44, "learning_rate": 1.2392165701541119e-05, "loss": 1.3018, "step": 16127 }, { "epoch": 0.44, "learning_rate": 1.2391306865562737e-05, "loss": 1.3088, "step": 16128 }, { "epoch": 0.44, "learning_rate": 1.2390448010875897e-05, "loss": 1.2944, "step": 16129 }, { "epoch": 0.44, "learning_rate": 1.2389589137487317e-05, "loss": 1.1804, "step": 16130 }, { "epoch": 0.44, "learning_rate": 1.2388730245403713e-05, "loss": 1.373, "step": 16131 }, { "epoch": 0.44, "learning_rate": 1.2387871334631807e-05, "loss": 1.2239, "step": 16132 }, { "epoch": 0.44, "learning_rate": 1.238701240517832e-05, "loss": 1.2202, "step": 16133 }, { "epoch": 0.44, "learning_rate": 1.238615345704997e-05, "loss": 1.3079, "step": 16134 }, { "epoch": 0.44, "learning_rate": 1.2385294490253476e-05, "loss": 1.3538, "step": 16135 }, { "epoch": 0.44, "learning_rate": 1.2384435504795558e-05, "loss": 1.1619, "step": 16136 }, { "epoch": 0.44, "learning_rate": 1.2383576500682941e-05, "loss": 1.4341, "step": 16137 }, { "epoch": 0.44, "learning_rate": 1.238271747792234e-05, "loss": 1.3496, "step": 16138 }, { "epoch": 0.44, "learning_rate": 1.2381858436520482e-05, "loss": 1.1953, "step": 16139 }, { "epoch": 0.44, "learning_rate": 1.238099937648408e-05, "loss": 1.3291, "step": 16140 }, { "epoch": 0.44, "learning_rate": 1.238014029781986e-05, "loss": 1.2632, "step": 16141 }, { "epoch": 0.44, "learning_rate": 1.237928120053454e-05, "loss": 1.2739, "step": 16142 }, { "epoch": 0.44, "learning_rate": 1.2378422084634846e-05, "loss": 1.3071, "step": 16143 }, { "epoch": 0.44, "learning_rate": 1.2377562950127493e-05, "loss": 1.2935, "step": 16144 }, { "epoch": 0.44, "learning_rate": 1.2376703797019207e-05, "loss": 1.2371, "step": 16145 }, { "epoch": 0.44, "learning_rate": 1.2375844625316706e-05, "loss": 1.311, "step": 16146 }, { "epoch": 0.44, "learning_rate": 1.2374985435026718e-05, "loss": 1.2104, "step": 16147 }, { "epoch": 0.44, "learning_rate": 1.2374126226155956e-05, "loss": 1.1562, "step": 16148 }, { "epoch": 0.44, "learning_rate": 1.2373266998711152e-05, "loss": 1.2769, "step": 16149 }, { "epoch": 0.44, "learning_rate": 1.2372407752699018e-05, "loss": 1.3662, "step": 16150 }, { "epoch": 0.44, "learning_rate": 1.2371548488126283e-05, "loss": 1.8359, "step": 16151 }, { "epoch": 0.44, "learning_rate": 1.2370689204999666e-05, "loss": 1.2143, "step": 16152 }, { "epoch": 0.44, "learning_rate": 1.2369829903325894e-05, "loss": 1.1201, "step": 16153 }, { "epoch": 0.44, "learning_rate": 1.2368970583111687e-05, "loss": 1.2566, "step": 16154 }, { "epoch": 0.44, "learning_rate": 1.2368111244363767e-05, "loss": 1.3379, "step": 16155 }, { "epoch": 0.44, "learning_rate": 1.2367251887088858e-05, "loss": 1.3679, "step": 16156 }, { "epoch": 0.44, "learning_rate": 1.2366392511293687e-05, "loss": 1.446, "step": 16157 }, { "epoch": 0.44, "learning_rate": 1.236553311698497e-05, "loss": 1.3491, "step": 16158 }, { "epoch": 0.44, "learning_rate": 1.2364673704169436e-05, "loss": 1.2368, "step": 16159 }, { "epoch": 0.44, "learning_rate": 1.2363814272853805e-05, "loss": 1.4668, "step": 16160 }, { "epoch": 0.44, "learning_rate": 1.2362954823044806e-05, "loss": 1.3391, "step": 16161 }, { "epoch": 0.44, "learning_rate": 1.2362095354749155e-05, "loss": 1.2915, "step": 16162 }, { "epoch": 0.44, "learning_rate": 1.2361235867973584e-05, "loss": 1.4119, "step": 16163 }, { "epoch": 0.44, "learning_rate": 1.2360376362724813e-05, "loss": 1.4104, "step": 16164 }, { "epoch": 0.44, "learning_rate": 1.235951683900957e-05, "loss": 1.3699, "step": 16165 }, { "epoch": 0.44, "learning_rate": 1.2358657296834573e-05, "loss": 1.3274, "step": 16166 }, { "epoch": 0.44, "learning_rate": 1.2357797736206552e-05, "loss": 1.2588, "step": 16167 }, { "epoch": 0.44, "learning_rate": 1.2356938157132227e-05, "loss": 1.2749, "step": 16168 }, { "epoch": 0.44, "learning_rate": 1.2356078559618329e-05, "loss": 1.1287, "step": 16169 }, { "epoch": 0.44, "learning_rate": 1.235521894367158e-05, "loss": 1.1707, "step": 16170 }, { "epoch": 0.44, "learning_rate": 1.2354359309298707e-05, "loss": 1.2827, "step": 16171 }, { "epoch": 0.44, "learning_rate": 1.2353499656506433e-05, "loss": 1.4009, "step": 16172 }, { "epoch": 0.44, "learning_rate": 1.2352639985301482e-05, "loss": 1.3989, "step": 16173 }, { "epoch": 0.44, "learning_rate": 1.2351780295690587e-05, "loss": 1.2666, "step": 16174 }, { "epoch": 0.44, "learning_rate": 1.2350920587680463e-05, "loss": 1.094, "step": 16175 }, { "epoch": 0.44, "learning_rate": 1.2350060861277845e-05, "loss": 1.3462, "step": 16176 }, { "epoch": 0.44, "learning_rate": 1.2349201116489456e-05, "loss": 1.1365, "step": 16177 }, { "epoch": 0.44, "learning_rate": 1.2348341353322024e-05, "loss": 1.2024, "step": 16178 }, { "epoch": 0.44, "learning_rate": 1.2347481571782269e-05, "loss": 1.3669, "step": 16179 }, { "epoch": 0.44, "learning_rate": 1.2346621771876926e-05, "loss": 1.3328, "step": 16180 }, { "epoch": 0.44, "learning_rate": 1.2345761953612714e-05, "loss": 1.3184, "step": 16181 }, { "epoch": 0.44, "learning_rate": 1.2344902116996366e-05, "loss": 1.1213, "step": 16182 }, { "epoch": 0.44, "learning_rate": 1.2344042262034606e-05, "loss": 1.1288, "step": 16183 }, { "epoch": 0.44, "learning_rate": 1.2343182388734161e-05, "loss": 1.26, "step": 16184 }, { "epoch": 0.44, "learning_rate": 1.2342322497101757e-05, "loss": 1.3489, "step": 16185 }, { "epoch": 0.44, "learning_rate": 1.2341462587144128e-05, "loss": 1.3623, "step": 16186 }, { "epoch": 0.44, "learning_rate": 1.2340602658867992e-05, "loss": 1.1865, "step": 16187 }, { "epoch": 0.44, "learning_rate": 1.2339742712280086e-05, "loss": 1.2664, "step": 16188 }, { "epoch": 0.44, "learning_rate": 1.2338882747387131e-05, "loss": 1.2903, "step": 16189 }, { "epoch": 0.44, "learning_rate": 1.2338022764195859e-05, "loss": 1.2615, "step": 16190 }, { "epoch": 0.44, "learning_rate": 1.2337162762712993e-05, "loss": 1.3352, "step": 16191 }, { "epoch": 0.44, "learning_rate": 1.2336302742945268e-05, "loss": 1.3147, "step": 16192 }, { "epoch": 0.44, "learning_rate": 1.2335442704899405e-05, "loss": 1.241, "step": 16193 }, { "epoch": 0.44, "learning_rate": 1.2334582648582138e-05, "loss": 1.3723, "step": 16194 }, { "epoch": 0.44, "learning_rate": 1.2333722574000195e-05, "loss": 1.2976, "step": 16195 }, { "epoch": 0.44, "learning_rate": 1.2332862481160306e-05, "loss": 1.3293, "step": 16196 }, { "epoch": 0.44, "learning_rate": 1.2332002370069193e-05, "loss": 1.2449, "step": 16197 }, { "epoch": 0.44, "learning_rate": 1.2331142240733594e-05, "loss": 1.1829, "step": 16198 }, { "epoch": 0.44, "learning_rate": 1.2330282093160231e-05, "loss": 1.2998, "step": 16199 }, { "epoch": 0.44, "learning_rate": 1.2329421927355838e-05, "loss": 1.3647, "step": 16200 }, { "epoch": 0.44, "learning_rate": 1.2328561743327143e-05, "loss": 1.3416, "step": 16201 }, { "epoch": 0.44, "learning_rate": 1.2327701541080879e-05, "loss": 1.2212, "step": 16202 }, { "epoch": 0.44, "learning_rate": 1.2326841320623769e-05, "loss": 1.438, "step": 16203 }, { "epoch": 0.44, "learning_rate": 1.232598108196255e-05, "loss": 1.2744, "step": 16204 }, { "epoch": 0.44, "learning_rate": 1.2325120825103945e-05, "loss": 1.3281, "step": 16205 }, { "epoch": 0.44, "learning_rate": 1.2324260550054692e-05, "loss": 1.417, "step": 16206 }, { "epoch": 0.44, "learning_rate": 1.2323400256821514e-05, "loss": 1.1997, "step": 16207 }, { "epoch": 0.44, "learning_rate": 1.2322539945411148e-05, "loss": 1.2449, "step": 16208 }, { "epoch": 0.44, "learning_rate": 1.2321679615830317e-05, "loss": 1.3325, "step": 16209 }, { "epoch": 0.44, "learning_rate": 1.2320819268085761e-05, "loss": 1.3567, "step": 16210 }, { "epoch": 0.44, "learning_rate": 1.2319958902184203e-05, "loss": 1.3516, "step": 16211 }, { "epoch": 0.44, "learning_rate": 1.231909851813238e-05, "loss": 1.1902, "step": 16212 }, { "epoch": 0.44, "learning_rate": 1.231823811593702e-05, "loss": 1.2922, "step": 16213 }, { "epoch": 0.44, "learning_rate": 1.2317377695604853e-05, "loss": 1.2705, "step": 16214 }, { "epoch": 0.44, "learning_rate": 1.2316517257142616e-05, "loss": 1.4451, "step": 16215 }, { "epoch": 0.44, "learning_rate": 1.2315656800557035e-05, "loss": 1.1599, "step": 16216 }, { "epoch": 0.44, "learning_rate": 1.2314796325854845e-05, "loss": 1.2847, "step": 16217 }, { "epoch": 0.44, "learning_rate": 1.2313935833042777e-05, "loss": 1.2646, "step": 16218 }, { "epoch": 0.44, "learning_rate": 1.231307532212756e-05, "loss": 1.4893, "step": 16219 }, { "epoch": 0.44, "learning_rate": 1.2312214793115934e-05, "loss": 1.2255, "step": 16220 }, { "epoch": 0.44, "learning_rate": 1.2311354246014626e-05, "loss": 1.3345, "step": 16221 }, { "epoch": 0.44, "learning_rate": 1.231049368083037e-05, "loss": 1.3486, "step": 16222 }, { "epoch": 0.44, "learning_rate": 1.2309633097569893e-05, "loss": 1.3501, "step": 16223 }, { "epoch": 0.44, "learning_rate": 1.2308772496239937e-05, "loss": 1.2749, "step": 16224 }, { "epoch": 0.44, "learning_rate": 1.230791187684723e-05, "loss": 1.7495, "step": 16225 }, { "epoch": 0.44, "learning_rate": 1.2307051239398506e-05, "loss": 1.2239, "step": 16226 }, { "epoch": 0.44, "learning_rate": 1.2306190583900497e-05, "loss": 1.4045, "step": 16227 }, { "epoch": 0.44, "learning_rate": 1.2305329910359937e-05, "loss": 1.252, "step": 16228 }, { "epoch": 0.44, "learning_rate": 1.2304469218783561e-05, "loss": 1.3074, "step": 16229 }, { "epoch": 0.44, "learning_rate": 1.23036085091781e-05, "loss": 1.2991, "step": 16230 }, { "epoch": 0.44, "learning_rate": 1.230274778155029e-05, "loss": 1.3064, "step": 16231 }, { "epoch": 0.44, "learning_rate": 1.2301887035906866e-05, "loss": 1.2107, "step": 16232 }, { "epoch": 0.44, "learning_rate": 1.2301026272254557e-05, "loss": 1.2126, "step": 16233 }, { "epoch": 0.44, "learning_rate": 1.2300165490600103e-05, "loss": 1.2498, "step": 16234 }, { "epoch": 0.44, "learning_rate": 1.2299304690950235e-05, "loss": 1.2317, "step": 16235 }, { "epoch": 0.44, "learning_rate": 1.2298443873311687e-05, "loss": 1.353, "step": 16236 }, { "epoch": 0.44, "learning_rate": 1.2297583037691198e-05, "loss": 1.2346, "step": 16237 }, { "epoch": 0.44, "learning_rate": 1.2296722184095498e-05, "loss": 1.3359, "step": 16238 }, { "epoch": 0.44, "learning_rate": 1.2295861312531322e-05, "loss": 1.1077, "step": 16239 }, { "epoch": 0.44, "learning_rate": 1.2295000423005408e-05, "loss": 1.7109, "step": 16240 }, { "epoch": 0.44, "learning_rate": 1.2294139515524492e-05, "loss": 1.2971, "step": 16241 }, { "epoch": 0.44, "learning_rate": 1.2293278590095304e-05, "loss": 1.3872, "step": 16242 }, { "epoch": 0.44, "learning_rate": 1.2292417646724586e-05, "loss": 1.5105, "step": 16243 }, { "epoch": 0.44, "learning_rate": 1.2291556685419067e-05, "loss": 1.481, "step": 16244 }, { "epoch": 0.44, "learning_rate": 1.2290695706185485e-05, "loss": 1.303, "step": 16245 }, { "epoch": 0.44, "learning_rate": 1.2289834709030579e-05, "loss": 1.2979, "step": 16246 }, { "epoch": 0.44, "learning_rate": 1.2288973693961083e-05, "loss": 1.4224, "step": 16247 }, { "epoch": 0.44, "learning_rate": 1.2288112660983734e-05, "loss": 1.2473, "step": 16248 }, { "epoch": 0.44, "learning_rate": 1.2287251610105268e-05, "loss": 1.2605, "step": 16249 }, { "epoch": 0.44, "learning_rate": 1.2286390541332418e-05, "loss": 1.2681, "step": 16250 }, { "epoch": 0.44, "learning_rate": 1.2285529454671927e-05, "loss": 1.4092, "step": 16251 }, { "epoch": 0.44, "learning_rate": 1.2284668350130527e-05, "loss": 1.2229, "step": 16252 }, { "epoch": 0.44, "learning_rate": 1.2283807227714957e-05, "loss": 1.2219, "step": 16253 }, { "epoch": 0.44, "learning_rate": 1.228294608743195e-05, "loss": 1.3738, "step": 16254 }, { "epoch": 0.44, "learning_rate": 1.2282084929288249e-05, "loss": 1.2283, "step": 16255 }, { "epoch": 0.44, "learning_rate": 1.2281223753290588e-05, "loss": 1.3748, "step": 16256 }, { "epoch": 0.44, "learning_rate": 1.2280362559445707e-05, "loss": 1.2871, "step": 16257 }, { "epoch": 0.44, "learning_rate": 1.2279501347760338e-05, "loss": 1.2834, "step": 16258 }, { "epoch": 0.44, "learning_rate": 1.2278640118241225e-05, "loss": 1.2717, "step": 16259 }, { "epoch": 0.44, "learning_rate": 1.2277778870895101e-05, "loss": 1.1641, "step": 16260 }, { "epoch": 0.44, "learning_rate": 1.2276917605728706e-05, "loss": 1.4697, "step": 16261 }, { "epoch": 0.44, "learning_rate": 1.227605632274878e-05, "loss": 1.356, "step": 16262 }, { "epoch": 0.44, "learning_rate": 1.2275195021962059e-05, "loss": 1.1415, "step": 16263 }, { "epoch": 0.44, "learning_rate": 1.2274333703375283e-05, "loss": 1.2769, "step": 16264 }, { "epoch": 0.44, "learning_rate": 1.2273472366995189e-05, "loss": 1.293, "step": 16265 }, { "epoch": 0.44, "learning_rate": 1.2272611012828514e-05, "loss": 1.3369, "step": 16266 }, { "epoch": 0.44, "learning_rate": 1.2271749640882003e-05, "loss": 1.3511, "step": 16267 }, { "epoch": 0.44, "learning_rate": 1.227088825116239e-05, "loss": 1.4131, "step": 16268 }, { "epoch": 0.44, "learning_rate": 1.2270026843676415e-05, "loss": 1.25, "step": 16269 }, { "epoch": 0.44, "learning_rate": 1.2269165418430815e-05, "loss": 1.2788, "step": 16270 }, { "epoch": 0.44, "learning_rate": 1.2268303975432336e-05, "loss": 1.1416, "step": 16271 }, { "epoch": 0.44, "learning_rate": 1.2267442514687709e-05, "loss": 1.2695, "step": 16272 }, { "epoch": 0.44, "learning_rate": 1.2266581036203682e-05, "loss": 1.2632, "step": 16273 }, { "epoch": 0.44, "learning_rate": 1.2265719539986987e-05, "loss": 1.2869, "step": 16274 }, { "epoch": 0.44, "learning_rate": 1.2264858026044371e-05, "loss": 1.1877, "step": 16275 }, { "epoch": 0.44, "learning_rate": 1.226399649438257e-05, "loss": 1.1658, "step": 16276 }, { "epoch": 0.44, "learning_rate": 1.226313494500832e-05, "loss": 1.4229, "step": 16277 }, { "epoch": 0.44, "learning_rate": 1.2262273377928375e-05, "loss": 1.3076, "step": 16278 }, { "epoch": 0.44, "learning_rate": 1.226141179314946e-05, "loss": 1.1821, "step": 16279 }, { "epoch": 0.44, "learning_rate": 1.2260550190678328e-05, "loss": 1.281, "step": 16280 }, { "epoch": 0.44, "learning_rate": 1.225968857052171e-05, "loss": 1.2959, "step": 16281 }, { "epoch": 0.44, "learning_rate": 1.2258826932686353e-05, "loss": 1.314, "step": 16282 }, { "epoch": 0.44, "learning_rate": 1.2257965277178995e-05, "loss": 1.4243, "step": 16283 }, { "epoch": 0.44, "learning_rate": 1.2257103604006382e-05, "loss": 1.3069, "step": 16284 }, { "epoch": 0.44, "learning_rate": 1.2256241913175248e-05, "loss": 1.4412, "step": 16285 }, { "epoch": 0.44, "learning_rate": 1.225538020469234e-05, "loss": 1.3203, "step": 16286 }, { "epoch": 0.44, "learning_rate": 1.2254518478564396e-05, "loss": 1.3708, "step": 16287 }, { "epoch": 0.44, "learning_rate": 1.2253656734798163e-05, "loss": 1.3396, "step": 16288 }, { "epoch": 0.44, "learning_rate": 1.2252794973400377e-05, "loss": 1.2844, "step": 16289 }, { "epoch": 0.44, "learning_rate": 1.2251933194377784e-05, "loss": 1.498, "step": 16290 }, { "epoch": 0.44, "learning_rate": 1.2251071397737122e-05, "loss": 1.1318, "step": 16291 }, { "epoch": 0.44, "learning_rate": 1.2250209583485135e-05, "loss": 1.335, "step": 16292 }, { "epoch": 0.44, "learning_rate": 1.2249347751628569e-05, "loss": 1.3281, "step": 16293 }, { "epoch": 0.44, "learning_rate": 1.2248485902174166e-05, "loss": 1.0614, "step": 16294 }, { "epoch": 0.45, "learning_rate": 1.224762403512866e-05, "loss": 1.1459, "step": 16295 }, { "epoch": 0.45, "learning_rate": 1.2246762150498807e-05, "loss": 1.2056, "step": 16296 }, { "epoch": 0.45, "learning_rate": 1.224590024829134e-05, "loss": 1.4084, "step": 16297 }, { "epoch": 0.45, "learning_rate": 1.2245038328513009e-05, "loss": 1.354, "step": 16298 }, { "epoch": 0.45, "learning_rate": 1.224417639117055e-05, "loss": 1.4019, "step": 16299 }, { "epoch": 0.45, "learning_rate": 1.2243314436270713e-05, "loss": 1.407, "step": 16300 }, { "epoch": 0.45, "learning_rate": 1.2242452463820236e-05, "loss": 1.4016, "step": 16301 }, { "epoch": 0.45, "learning_rate": 1.2241590473825866e-05, "loss": 1.2617, "step": 16302 }, { "epoch": 0.45, "learning_rate": 1.2240728466294347e-05, "loss": 1.2739, "step": 16303 }, { "epoch": 0.45, "learning_rate": 1.2239866441232423e-05, "loss": 1.2466, "step": 16304 }, { "epoch": 0.45, "learning_rate": 1.2239004398646836e-05, "loss": 1.1578, "step": 16305 }, { "epoch": 0.45, "learning_rate": 1.2238142338544333e-05, "loss": 1.4348, "step": 16306 }, { "epoch": 0.45, "learning_rate": 1.2237280260931653e-05, "loss": 1.2952, "step": 16307 }, { "epoch": 0.45, "learning_rate": 1.2236418165815547e-05, "loss": 1.231, "step": 16308 }, { "epoch": 0.45, "learning_rate": 1.2235556053202756e-05, "loss": 1.3777, "step": 16309 }, { "epoch": 0.45, "learning_rate": 1.2234693923100027e-05, "loss": 1.3813, "step": 16310 }, { "epoch": 0.45, "learning_rate": 1.2233831775514103e-05, "loss": 1.2781, "step": 16311 }, { "epoch": 0.45, "learning_rate": 1.223296961045173e-05, "loss": 1.3689, "step": 16312 }, { "epoch": 0.45, "learning_rate": 1.2232107427919653e-05, "loss": 1.3813, "step": 16313 }, { "epoch": 0.45, "learning_rate": 1.2231245227924617e-05, "loss": 1.3535, "step": 16314 }, { "epoch": 0.45, "learning_rate": 1.2230383010473365e-05, "loss": 1.3538, "step": 16315 }, { "epoch": 0.45, "learning_rate": 1.222952077557265e-05, "loss": 1.1938, "step": 16316 }, { "epoch": 0.45, "learning_rate": 1.222865852322921e-05, "loss": 1.2856, "step": 16317 }, { "epoch": 0.45, "learning_rate": 1.2227796253449792e-05, "loss": 1.2595, "step": 16318 }, { "epoch": 0.45, "learning_rate": 1.2226933966241146e-05, "loss": 1.4385, "step": 16319 }, { "epoch": 0.45, "learning_rate": 1.2226071661610015e-05, "loss": 1.4382, "step": 16320 }, { "epoch": 0.45, "learning_rate": 1.2225209339563144e-05, "loss": 1.4336, "step": 16321 }, { "epoch": 0.45, "learning_rate": 1.2224347000107286e-05, "loss": 1.0974, "step": 16322 }, { "epoch": 0.45, "learning_rate": 1.2223484643249179e-05, "loss": 1.1311, "step": 16323 }, { "epoch": 0.45, "learning_rate": 1.2222622268995576e-05, "loss": 1.3228, "step": 16324 }, { "epoch": 0.45, "learning_rate": 1.2221759877353222e-05, "loss": 1.219, "step": 16325 }, { "epoch": 0.45, "learning_rate": 1.2220897468328862e-05, "loss": 1.3022, "step": 16326 }, { "epoch": 0.45, "learning_rate": 1.2220035041929246e-05, "loss": 1.7549, "step": 16327 }, { "epoch": 0.45, "learning_rate": 1.2219172598161118e-05, "loss": 1.2476, "step": 16328 }, { "epoch": 0.45, "learning_rate": 1.2218310137031229e-05, "loss": 1.228, "step": 16329 }, { "epoch": 0.45, "learning_rate": 1.2217447658546322e-05, "loss": 1.1807, "step": 16330 }, { "epoch": 0.45, "learning_rate": 1.221658516271315e-05, "loss": 1.3972, "step": 16331 }, { "epoch": 0.45, "learning_rate": 1.2215722649538458e-05, "loss": 1.2917, "step": 16332 }, { "epoch": 0.45, "learning_rate": 1.2214860119028991e-05, "loss": 1.2383, "step": 16333 }, { "epoch": 0.45, "learning_rate": 1.22139975711915e-05, "loss": 1.4385, "step": 16334 }, { "epoch": 0.45, "learning_rate": 1.2213135006032735e-05, "loss": 1.396, "step": 16335 }, { "epoch": 0.45, "learning_rate": 1.2212272423559444e-05, "loss": 1.3096, "step": 16336 }, { "epoch": 0.45, "learning_rate": 1.221140982377837e-05, "loss": 1.4004, "step": 16337 }, { "epoch": 0.45, "learning_rate": 1.2210547206696268e-05, "loss": 1.3, "step": 16338 }, { "epoch": 0.45, "learning_rate": 1.2209684572319885e-05, "loss": 1.3232, "step": 16339 }, { "epoch": 0.45, "learning_rate": 1.2208821920655965e-05, "loss": 1.2781, "step": 16340 }, { "epoch": 0.45, "learning_rate": 1.2207959251711265e-05, "loss": 1.3135, "step": 16341 }, { "epoch": 0.45, "learning_rate": 1.2207096565492527e-05, "loss": 1.3123, "step": 16342 }, { "epoch": 0.45, "learning_rate": 1.2206233862006506e-05, "loss": 1.3594, "step": 16343 }, { "epoch": 0.45, "learning_rate": 1.2205371141259948e-05, "loss": 1.3293, "step": 16344 }, { "epoch": 0.45, "learning_rate": 1.2204508403259603e-05, "loss": 1.4231, "step": 16345 }, { "epoch": 0.45, "learning_rate": 1.2203645648012218e-05, "loss": 1.3472, "step": 16346 }, { "epoch": 0.45, "learning_rate": 1.220278287552455e-05, "loss": 1.3545, "step": 16347 }, { "epoch": 0.45, "learning_rate": 1.2201920085803342e-05, "loss": 1.2266, "step": 16348 }, { "epoch": 0.45, "learning_rate": 1.220105727885535e-05, "loss": 1.3967, "step": 16349 }, { "epoch": 0.45, "learning_rate": 1.2200194454687317e-05, "loss": 1.3755, "step": 16350 }, { "epoch": 0.45, "learning_rate": 1.2199331613306e-05, "loss": 1.3025, "step": 16351 }, { "epoch": 0.45, "learning_rate": 1.2198468754718144e-05, "loss": 1.3167, "step": 16352 }, { "epoch": 0.45, "learning_rate": 1.2197605878930506e-05, "loss": 1.3269, "step": 16353 }, { "epoch": 0.45, "learning_rate": 1.2196742985949825e-05, "loss": 1.2466, "step": 16354 }, { "epoch": 0.45, "learning_rate": 1.2195880075782869e-05, "loss": 1.2732, "step": 16355 }, { "epoch": 0.45, "learning_rate": 1.2195017148436374e-05, "loss": 1.2505, "step": 16356 }, { "epoch": 0.45, "learning_rate": 1.21941542039171e-05, "loss": 1.3171, "step": 16357 }, { "epoch": 0.45, "learning_rate": 1.2193291242231795e-05, "loss": 1.2671, "step": 16358 }, { "epoch": 0.45, "learning_rate": 1.2192428263387211e-05, "loss": 1.3147, "step": 16359 }, { "epoch": 0.45, "learning_rate": 1.2191565267390098e-05, "loss": 1.2004, "step": 16360 }, { "epoch": 0.45, "learning_rate": 1.2190702254247209e-05, "loss": 1.343, "step": 16361 }, { "epoch": 0.45, "learning_rate": 1.2189839223965296e-05, "loss": 1.2004, "step": 16362 }, { "epoch": 0.45, "learning_rate": 1.218897617655111e-05, "loss": 1.3137, "step": 16363 }, { "epoch": 0.45, "learning_rate": 1.2188113112011407e-05, "loss": 1.2222, "step": 16364 }, { "epoch": 0.45, "learning_rate": 1.2187250030352934e-05, "loss": 1.4448, "step": 16365 }, { "epoch": 0.45, "learning_rate": 1.2186386931582442e-05, "loss": 1.2915, "step": 16366 }, { "epoch": 0.45, "learning_rate": 1.218552381570669e-05, "loss": 1.3667, "step": 16367 }, { "epoch": 0.45, "learning_rate": 1.2184660682732426e-05, "loss": 1.3071, "step": 16368 }, { "epoch": 0.45, "learning_rate": 1.2183797532666403e-05, "loss": 1.1487, "step": 16369 }, { "epoch": 0.45, "learning_rate": 1.2182934365515377e-05, "loss": 1.3174, "step": 16370 }, { "epoch": 0.45, "learning_rate": 1.21820711812861e-05, "loss": 1.311, "step": 16371 }, { "epoch": 0.45, "learning_rate": 1.2181207979985321e-05, "loss": 1.3838, "step": 16372 }, { "epoch": 0.45, "learning_rate": 1.21803447616198e-05, "loss": 1.2627, "step": 16373 }, { "epoch": 0.45, "learning_rate": 1.2179481526196285e-05, "loss": 1.334, "step": 16374 }, { "epoch": 0.45, "learning_rate": 1.2178618273721533e-05, "loss": 1.1663, "step": 16375 }, { "epoch": 0.45, "learning_rate": 1.2177755004202294e-05, "loss": 1.6567, "step": 16376 }, { "epoch": 0.45, "learning_rate": 1.2176891717645325e-05, "loss": 1.384, "step": 16377 }, { "epoch": 0.45, "learning_rate": 1.2176028414057379e-05, "loss": 1.4263, "step": 16378 }, { "epoch": 0.45, "learning_rate": 1.217516509344521e-05, "loss": 1.3606, "step": 16379 }, { "epoch": 0.45, "learning_rate": 1.2174301755815572e-05, "loss": 1.7524, "step": 16380 }, { "epoch": 0.45, "learning_rate": 1.2173438401175219e-05, "loss": 1.4326, "step": 16381 }, { "epoch": 0.45, "learning_rate": 1.2172575029530903e-05, "loss": 1.5635, "step": 16382 }, { "epoch": 0.45, "learning_rate": 1.2171711640889388e-05, "loss": 1.3682, "step": 16383 }, { "epoch": 0.45, "learning_rate": 1.2170848235257418e-05, "loss": 1.2495, "step": 16384 }, { "epoch": 0.45, "learning_rate": 1.2169984812641753e-05, "loss": 1.3459, "step": 16385 }, { "epoch": 0.45, "learning_rate": 1.2169121373049149e-05, "loss": 1.2876, "step": 16386 }, { "epoch": 0.45, "learning_rate": 1.2168257916486356e-05, "loss": 1.3022, "step": 16387 }, { "epoch": 0.45, "learning_rate": 1.2167394442960134e-05, "loss": 1.428, "step": 16388 }, { "epoch": 0.45, "learning_rate": 1.2166530952477238e-05, "loss": 1.3594, "step": 16389 }, { "epoch": 0.45, "learning_rate": 1.2165667445044422e-05, "loss": 1.2515, "step": 16390 }, { "epoch": 0.45, "learning_rate": 1.2164803920668443e-05, "loss": 1.2634, "step": 16391 }, { "epoch": 0.45, "learning_rate": 1.2163940379356057e-05, "loss": 1.3604, "step": 16392 }, { "epoch": 0.45, "learning_rate": 1.2163076821114015e-05, "loss": 1.2656, "step": 16393 }, { "epoch": 0.45, "learning_rate": 1.2162213245949082e-05, "loss": 1.3088, "step": 16394 }, { "epoch": 0.45, "learning_rate": 1.2161349653868006e-05, "loss": 1.2925, "step": 16395 }, { "epoch": 0.45, "learning_rate": 1.2160486044877549e-05, "loss": 1.1407, "step": 16396 }, { "epoch": 0.45, "learning_rate": 1.2159622418984463e-05, "loss": 1.3464, "step": 16397 }, { "epoch": 0.45, "learning_rate": 1.2158758776195507e-05, "loss": 1.2993, "step": 16398 }, { "epoch": 0.45, "learning_rate": 1.2157895116517438e-05, "loss": 1.3794, "step": 16399 }, { "epoch": 0.45, "learning_rate": 1.215703143995701e-05, "loss": 1.5022, "step": 16400 }, { "epoch": 0.45, "learning_rate": 1.2156167746520984e-05, "loss": 1.3, "step": 16401 }, { "epoch": 0.45, "learning_rate": 1.2155304036216118e-05, "loss": 1.2996, "step": 16402 }, { "epoch": 0.45, "learning_rate": 1.2154440309049162e-05, "loss": 1.2888, "step": 16403 }, { "epoch": 0.45, "learning_rate": 1.2153576565026883e-05, "loss": 1.2319, "step": 16404 }, { "epoch": 0.45, "learning_rate": 1.215271280415603e-05, "loss": 1.2627, "step": 16405 }, { "epoch": 0.45, "learning_rate": 1.2151849026443368e-05, "loss": 1.3245, "step": 16406 }, { "epoch": 0.45, "learning_rate": 1.2150985231895647e-05, "loss": 1.2947, "step": 16407 }, { "epoch": 0.45, "learning_rate": 1.2150121420519632e-05, "loss": 1.2957, "step": 16408 }, { "epoch": 0.45, "learning_rate": 1.2149257592322076e-05, "loss": 1.4116, "step": 16409 }, { "epoch": 0.45, "learning_rate": 1.2148393747309742e-05, "loss": 1.3293, "step": 16410 }, { "epoch": 0.45, "learning_rate": 1.2147529885489383e-05, "loss": 1.2349, "step": 16411 }, { "epoch": 0.45, "learning_rate": 1.2146666006867762e-05, "loss": 1.3535, "step": 16412 }, { "epoch": 0.45, "learning_rate": 1.2145802111451632e-05, "loss": 1.2385, "step": 16413 }, { "epoch": 0.45, "learning_rate": 1.214493819924776e-05, "loss": 1.2615, "step": 16414 }, { "epoch": 0.45, "learning_rate": 1.2144074270262896e-05, "loss": 1.3311, "step": 16415 }, { "epoch": 0.45, "learning_rate": 1.2143210324503804e-05, "loss": 1.1877, "step": 16416 }, { "epoch": 0.45, "learning_rate": 1.2142346361977241e-05, "loss": 1.2312, "step": 16417 }, { "epoch": 0.45, "learning_rate": 1.2141482382689973e-05, "loss": 1.322, "step": 16418 }, { "epoch": 0.45, "learning_rate": 1.2140618386648747e-05, "loss": 1.292, "step": 16419 }, { "epoch": 0.45, "learning_rate": 1.2139754373860335e-05, "loss": 1.0674, "step": 16420 }, { "epoch": 0.45, "learning_rate": 1.213889034433149e-05, "loss": 1.1953, "step": 16421 }, { "epoch": 0.45, "learning_rate": 1.213802629806897e-05, "loss": 1.186, "step": 16422 }, { "epoch": 0.45, "learning_rate": 1.2137162235079538e-05, "loss": 1.3418, "step": 16423 }, { "epoch": 0.45, "learning_rate": 1.2136298155369956e-05, "loss": 1.2688, "step": 16424 }, { "epoch": 0.45, "learning_rate": 1.213543405894698e-05, "loss": 1.3066, "step": 16425 }, { "epoch": 0.45, "learning_rate": 1.2134569945817374e-05, "loss": 1.4255, "step": 16426 }, { "epoch": 0.45, "learning_rate": 1.2133705815987893e-05, "loss": 1.3164, "step": 16427 }, { "epoch": 0.45, "learning_rate": 1.2132841669465304e-05, "loss": 1.249, "step": 16428 }, { "epoch": 0.45, "learning_rate": 1.2131977506256365e-05, "loss": 1.3098, "step": 16429 }, { "epoch": 0.45, "learning_rate": 1.2131113326367836e-05, "loss": 1.3301, "step": 16430 }, { "epoch": 0.45, "learning_rate": 1.2130249129806475e-05, "loss": 1.1353, "step": 16431 }, { "epoch": 0.45, "learning_rate": 1.212938491657905e-05, "loss": 1.2634, "step": 16432 }, { "epoch": 0.45, "learning_rate": 1.2128520686692318e-05, "loss": 1.2793, "step": 16433 }, { "epoch": 0.45, "learning_rate": 1.2127656440153041e-05, "loss": 1.1809, "step": 16434 }, { "epoch": 0.45, "learning_rate": 1.212679217696798e-05, "loss": 1.2581, "step": 16435 }, { "epoch": 0.45, "learning_rate": 1.2125927897143898e-05, "loss": 1.4409, "step": 16436 }, { "epoch": 0.45, "learning_rate": 1.2125063600687557e-05, "loss": 1.2554, "step": 16437 }, { "epoch": 0.45, "learning_rate": 1.2124199287605716e-05, "loss": 1.4214, "step": 16438 }, { "epoch": 0.45, "learning_rate": 1.212333495790514e-05, "loss": 1.3059, "step": 16439 }, { "epoch": 0.45, "learning_rate": 1.2122470611592587e-05, "loss": 1.4521, "step": 16440 }, { "epoch": 0.45, "learning_rate": 1.2121606248674823e-05, "loss": 1.2993, "step": 16441 }, { "epoch": 0.45, "learning_rate": 1.212074186915861e-05, "loss": 1.2048, "step": 16442 }, { "epoch": 0.45, "learning_rate": 1.2119877473050712e-05, "loss": 1.3601, "step": 16443 }, { "epoch": 0.45, "learning_rate": 1.2119013060357885e-05, "loss": 1.7148, "step": 16444 }, { "epoch": 0.45, "learning_rate": 1.21181486310869e-05, "loss": 1.3062, "step": 16445 }, { "epoch": 0.45, "learning_rate": 1.2117284185244513e-05, "loss": 1.6323, "step": 16446 }, { "epoch": 0.45, "learning_rate": 1.2116419722837492e-05, "loss": 1.3767, "step": 16447 }, { "epoch": 0.45, "learning_rate": 1.2115555243872596e-05, "loss": 1.311, "step": 16448 }, { "epoch": 0.45, "learning_rate": 1.2114690748356594e-05, "loss": 1.3904, "step": 16449 }, { "epoch": 0.45, "learning_rate": 1.2113826236296245e-05, "loss": 1.3706, "step": 16450 }, { "epoch": 0.45, "learning_rate": 1.2112961707698312e-05, "loss": 1.2893, "step": 16451 }, { "epoch": 0.45, "learning_rate": 1.2112097162569562e-05, "loss": 1.072, "step": 16452 }, { "epoch": 0.45, "learning_rate": 1.2111232600916756e-05, "loss": 1.1892, "step": 16453 }, { "epoch": 0.45, "learning_rate": 1.2110368022746659e-05, "loss": 1.4058, "step": 16454 }, { "epoch": 0.45, "learning_rate": 1.2109503428066036e-05, "loss": 1.2444, "step": 16455 }, { "epoch": 0.45, "learning_rate": 1.2108638816881648e-05, "loss": 1.1711, "step": 16456 }, { "epoch": 0.45, "learning_rate": 1.2107774189200265e-05, "loss": 1.2488, "step": 16457 }, { "epoch": 0.45, "learning_rate": 1.2106909545028644e-05, "loss": 1.3081, "step": 16458 }, { "epoch": 0.45, "learning_rate": 1.2106044884373555e-05, "loss": 1.2915, "step": 16459 }, { "epoch": 0.45, "learning_rate": 1.2105180207241763e-05, "loss": 1.3716, "step": 16460 }, { "epoch": 0.45, "learning_rate": 1.2104315513640028e-05, "loss": 1.376, "step": 16461 }, { "epoch": 0.45, "learning_rate": 1.2103450803575116e-05, "loss": 1.3071, "step": 16462 }, { "epoch": 0.45, "learning_rate": 1.21025860770538e-05, "loss": 1.3191, "step": 16463 }, { "epoch": 0.45, "learning_rate": 1.2101721334082834e-05, "loss": 1.3518, "step": 16464 }, { "epoch": 0.45, "learning_rate": 1.2100856574668992e-05, "loss": 1.3608, "step": 16465 }, { "epoch": 0.45, "learning_rate": 1.2099991798819035e-05, "loss": 1.3198, "step": 16466 }, { "epoch": 0.45, "learning_rate": 1.2099127006539731e-05, "loss": 1.3623, "step": 16467 }, { "epoch": 0.45, "learning_rate": 1.2098262197837842e-05, "loss": 1.4155, "step": 16468 }, { "epoch": 0.45, "learning_rate": 1.2097397372720139e-05, "loss": 1.3508, "step": 16469 }, { "epoch": 0.45, "learning_rate": 1.2096532531193383e-05, "loss": 1.3542, "step": 16470 }, { "epoch": 0.45, "learning_rate": 1.2095667673264345e-05, "loss": 1.448, "step": 16471 }, { "epoch": 0.45, "learning_rate": 1.2094802798939784e-05, "loss": 1.3989, "step": 16472 }, { "epoch": 0.45, "learning_rate": 1.2093937908226474e-05, "loss": 1.3525, "step": 16473 }, { "epoch": 0.45, "learning_rate": 1.2093073001131178e-05, "loss": 1.334, "step": 16474 }, { "epoch": 0.45, "learning_rate": 1.2092208077660662e-05, "loss": 1.2463, "step": 16475 }, { "epoch": 0.45, "learning_rate": 1.2091343137821696e-05, "loss": 1.1812, "step": 16476 }, { "epoch": 0.45, "learning_rate": 1.2090478181621044e-05, "loss": 1.2058, "step": 16477 }, { "epoch": 0.45, "learning_rate": 1.2089613209065472e-05, "loss": 1.3335, "step": 16478 }, { "epoch": 0.45, "learning_rate": 1.208874822016175e-05, "loss": 1.2876, "step": 16479 }, { "epoch": 0.45, "learning_rate": 1.2087883214916645e-05, "loss": 1.4014, "step": 16480 }, { "epoch": 0.45, "learning_rate": 1.208701819333692e-05, "loss": 1.3247, "step": 16481 }, { "epoch": 0.45, "learning_rate": 1.2086153155429349e-05, "loss": 1.2483, "step": 16482 }, { "epoch": 0.45, "learning_rate": 1.2085288101200698e-05, "loss": 1.3875, "step": 16483 }, { "epoch": 0.45, "learning_rate": 1.2084423030657731e-05, "loss": 1.438, "step": 16484 }, { "epoch": 0.45, "learning_rate": 1.208355794380722e-05, "loss": 1.4229, "step": 16485 }, { "epoch": 0.45, "learning_rate": 1.208269284065593e-05, "loss": 1.2874, "step": 16486 }, { "epoch": 0.45, "learning_rate": 1.2081827721210634e-05, "loss": 1.2703, "step": 16487 }, { "epoch": 0.45, "learning_rate": 1.2080962585478092e-05, "loss": 1.4026, "step": 16488 }, { "epoch": 0.45, "learning_rate": 1.2080097433465079e-05, "loss": 1.4976, "step": 16489 }, { "epoch": 0.45, "learning_rate": 1.2079232265178362e-05, "loss": 1.2905, "step": 16490 }, { "epoch": 0.45, "learning_rate": 1.2078367080624712e-05, "loss": 1.3074, "step": 16491 }, { "epoch": 0.45, "learning_rate": 1.2077501879810891e-05, "loss": 1.2866, "step": 16492 }, { "epoch": 0.45, "learning_rate": 1.2076636662743673e-05, "loss": 1.3237, "step": 16493 }, { "epoch": 0.45, "learning_rate": 1.2075771429429829e-05, "loss": 1.3818, "step": 16494 }, { "epoch": 0.45, "learning_rate": 1.2074906179876122e-05, "loss": 1.4119, "step": 16495 }, { "epoch": 0.45, "learning_rate": 1.207404091408933e-05, "loss": 1.2683, "step": 16496 }, { "epoch": 0.45, "learning_rate": 1.207317563207621e-05, "loss": 1.3403, "step": 16497 }, { "epoch": 0.45, "learning_rate": 1.2072310333843544e-05, "loss": 1.3162, "step": 16498 }, { "epoch": 0.45, "learning_rate": 1.2071445019398094e-05, "loss": 1.1323, "step": 16499 }, { "epoch": 0.45, "learning_rate": 1.2070579688746635e-05, "loss": 1.3262, "step": 16500 }, { "epoch": 0.45, "learning_rate": 1.206971434189593e-05, "loss": 1.2732, "step": 16501 }, { "epoch": 0.45, "learning_rate": 1.2068848978852756e-05, "loss": 1.3757, "step": 16502 }, { "epoch": 0.45, "learning_rate": 1.206798359962388e-05, "loss": 1.2407, "step": 16503 }, { "epoch": 0.45, "learning_rate": 1.2067118204216075e-05, "loss": 1.2683, "step": 16504 }, { "epoch": 0.45, "learning_rate": 1.2066252792636104e-05, "loss": 1.2656, "step": 16505 }, { "epoch": 0.45, "learning_rate": 1.2065387364890748e-05, "loss": 1.2571, "step": 16506 }, { "epoch": 0.45, "learning_rate": 1.2064521920986769e-05, "loss": 1.1531, "step": 16507 }, { "epoch": 0.45, "learning_rate": 1.2063656460930943e-05, "loss": 1.3616, "step": 16508 }, { "epoch": 0.45, "learning_rate": 1.2062790984730035e-05, "loss": 1.4277, "step": 16509 }, { "epoch": 0.45, "learning_rate": 1.2061925492390827e-05, "loss": 1.4155, "step": 16510 }, { "epoch": 0.45, "learning_rate": 1.2061059983920078e-05, "loss": 1.1243, "step": 16511 }, { "epoch": 0.45, "learning_rate": 1.206019445932457e-05, "loss": 1.4163, "step": 16512 }, { "epoch": 0.45, "learning_rate": 1.2059328918611065e-05, "loss": 1.4346, "step": 16513 }, { "epoch": 0.45, "learning_rate": 1.205846336178634e-05, "loss": 1.2078, "step": 16514 }, { "epoch": 0.45, "learning_rate": 1.2057597788857167e-05, "loss": 1.2246, "step": 16515 }, { "epoch": 0.45, "learning_rate": 1.2056732199830317e-05, "loss": 1.3657, "step": 16516 }, { "epoch": 0.45, "learning_rate": 1.205586659471256e-05, "loss": 1.293, "step": 16517 }, { "epoch": 0.45, "learning_rate": 1.205500097351067e-05, "loss": 1.3591, "step": 16518 }, { "epoch": 0.45, "learning_rate": 1.2054135336231417e-05, "loss": 1.3914, "step": 16519 }, { "epoch": 0.45, "learning_rate": 1.2053269682881576e-05, "loss": 1.2207, "step": 16520 }, { "epoch": 0.45, "learning_rate": 1.205240401346792e-05, "loss": 1.3091, "step": 16521 }, { "epoch": 0.45, "learning_rate": 1.2051538327997219e-05, "loss": 1.2644, "step": 16522 }, { "epoch": 0.45, "learning_rate": 1.2050672626476247e-05, "loss": 1.2827, "step": 16523 }, { "epoch": 0.45, "learning_rate": 1.2049806908911775e-05, "loss": 1.3691, "step": 16524 }, { "epoch": 0.45, "learning_rate": 1.2048941175310578e-05, "loss": 1.2644, "step": 16525 }, { "epoch": 0.45, "learning_rate": 1.204807542567943e-05, "loss": 1.239, "step": 16526 }, { "epoch": 0.45, "learning_rate": 1.2047209660025103e-05, "loss": 1.2612, "step": 16527 }, { "epoch": 0.45, "learning_rate": 1.2046343878354372e-05, "loss": 1.3569, "step": 16528 }, { "epoch": 0.45, "learning_rate": 1.2045478080674005e-05, "loss": 1.3523, "step": 16529 }, { "epoch": 0.45, "learning_rate": 1.2044612266990783e-05, "loss": 1.2659, "step": 16530 }, { "epoch": 0.45, "learning_rate": 1.2043746437311473e-05, "loss": 1.408, "step": 16531 }, { "epoch": 0.45, "learning_rate": 1.2042880591642854e-05, "loss": 1.4133, "step": 16532 }, { "epoch": 0.45, "learning_rate": 1.2042014729991696e-05, "loss": 1.3228, "step": 16533 }, { "epoch": 0.45, "learning_rate": 1.2041148852364776e-05, "loss": 1.3872, "step": 16534 }, { "epoch": 0.45, "learning_rate": 1.2040282958768868e-05, "loss": 1.519, "step": 16535 }, { "epoch": 0.45, "learning_rate": 1.2039417049210744e-05, "loss": 1.314, "step": 16536 }, { "epoch": 0.45, "learning_rate": 1.203855112369718e-05, "loss": 1.2456, "step": 16537 }, { "epoch": 0.45, "learning_rate": 1.2037685182234953e-05, "loss": 1.1897, "step": 16538 }, { "epoch": 0.45, "learning_rate": 1.2036819224830833e-05, "loss": 1.3267, "step": 16539 }, { "epoch": 0.45, "learning_rate": 1.2035953251491596e-05, "loss": 1.3467, "step": 16540 }, { "epoch": 0.45, "learning_rate": 1.2035087262224022e-05, "loss": 1.1229, "step": 16541 }, { "epoch": 0.45, "learning_rate": 1.2034221257034879e-05, "loss": 1.2446, "step": 16542 }, { "epoch": 0.45, "learning_rate": 1.2033355235930949e-05, "loss": 1.2729, "step": 16543 }, { "epoch": 0.45, "learning_rate": 1.2032489198919e-05, "loss": 1.2373, "step": 16544 }, { "epoch": 0.45, "learning_rate": 1.2031623146005813e-05, "loss": 1.1636, "step": 16545 }, { "epoch": 0.45, "learning_rate": 1.203075707719816e-05, "loss": 1.3677, "step": 16546 }, { "epoch": 0.45, "learning_rate": 1.2029890992502822e-05, "loss": 1.281, "step": 16547 }, { "epoch": 0.45, "learning_rate": 1.2029024891926568e-05, "loss": 1.1628, "step": 16548 }, { "epoch": 0.45, "learning_rate": 1.202815877547618e-05, "loss": 1.1711, "step": 16549 }, { "epoch": 0.45, "learning_rate": 1.202729264315843e-05, "loss": 1.4146, "step": 16550 }, { "epoch": 0.45, "learning_rate": 1.2026426494980096e-05, "loss": 1.3311, "step": 16551 }, { "epoch": 0.45, "learning_rate": 1.2025560330947954e-05, "loss": 1.2234, "step": 16552 }, { "epoch": 0.45, "learning_rate": 1.202469415106878e-05, "loss": 1.4363, "step": 16553 }, { "epoch": 0.45, "learning_rate": 1.2023827955349353e-05, "loss": 1.3262, "step": 16554 }, { "epoch": 0.45, "learning_rate": 1.2022961743796444e-05, "loss": 1.321, "step": 16555 }, { "epoch": 0.45, "learning_rate": 1.2022095516416834e-05, "loss": 1.2676, "step": 16556 }, { "epoch": 0.45, "learning_rate": 1.2021229273217303e-05, "loss": 1.4512, "step": 16557 }, { "epoch": 0.45, "learning_rate": 1.2020363014204622e-05, "loss": 1.4185, "step": 16558 }, { "epoch": 0.45, "learning_rate": 1.2019496739385573e-05, "loss": 1.3132, "step": 16559 }, { "epoch": 0.45, "learning_rate": 1.2018630448766928e-05, "loss": 1.4553, "step": 16560 }, { "epoch": 0.45, "learning_rate": 1.2017764142355471e-05, "loss": 1.3555, "step": 16561 }, { "epoch": 0.45, "learning_rate": 1.2016897820157973e-05, "loss": 1.3008, "step": 16562 }, { "epoch": 0.45, "learning_rate": 1.2016031482181218e-05, "loss": 1.2173, "step": 16563 }, { "epoch": 0.45, "learning_rate": 1.2015165128431978e-05, "loss": 1.3401, "step": 16564 }, { "epoch": 0.45, "learning_rate": 1.2014298758917037e-05, "loss": 1.2095, "step": 16565 }, { "epoch": 0.45, "learning_rate": 1.2013432373643165e-05, "loss": 1.28, "step": 16566 }, { "epoch": 0.45, "learning_rate": 1.2012565972617149e-05, "loss": 1.3428, "step": 16567 }, { "epoch": 0.45, "learning_rate": 1.2011699555845762e-05, "loss": 1.4165, "step": 16568 }, { "epoch": 0.45, "learning_rate": 1.2010833123335784e-05, "loss": 1.4604, "step": 16569 }, { "epoch": 0.45, "learning_rate": 1.200996667509399e-05, "loss": 1.3342, "step": 16570 }, { "epoch": 0.45, "learning_rate": 1.2009100211127165e-05, "loss": 1.3064, "step": 16571 }, { "epoch": 0.45, "learning_rate": 1.2008233731442083e-05, "loss": 1.3398, "step": 16572 }, { "epoch": 0.45, "learning_rate": 1.2007367236045527e-05, "loss": 1.2124, "step": 16573 }, { "epoch": 0.45, "learning_rate": 1.200650072494427e-05, "loss": 1.2805, "step": 16574 }, { "epoch": 0.45, "learning_rate": 1.20056341981451e-05, "loss": 1.2991, "step": 16575 }, { "epoch": 0.45, "learning_rate": 1.2004767655654788e-05, "loss": 1.3557, "step": 16576 }, { "epoch": 0.45, "learning_rate": 1.2003901097480117e-05, "loss": 1.3906, "step": 16577 }, { "epoch": 0.45, "learning_rate": 1.2003034523627865e-05, "loss": 1.4446, "step": 16578 }, { "epoch": 0.45, "learning_rate": 1.2002167934104815e-05, "loss": 1.1388, "step": 16579 }, { "epoch": 0.45, "learning_rate": 1.2001301328917743e-05, "loss": 1.1553, "step": 16580 }, { "epoch": 0.45, "learning_rate": 1.2000434708073432e-05, "loss": 1.2893, "step": 16581 }, { "epoch": 0.45, "learning_rate": 1.1999568071578658e-05, "loss": 1.259, "step": 16582 }, { "epoch": 0.45, "learning_rate": 1.1998701419440206e-05, "loss": 1.2881, "step": 16583 }, { "epoch": 0.45, "learning_rate": 1.1997834751664852e-05, "loss": 1.3406, "step": 16584 }, { "epoch": 0.45, "learning_rate": 1.199696806825938e-05, "loss": 1.3879, "step": 16585 }, { "epoch": 0.45, "learning_rate": 1.1996101369230569e-05, "loss": 1.3909, "step": 16586 }, { "epoch": 0.45, "learning_rate": 1.1995234654585194e-05, "loss": 1.2209, "step": 16587 }, { "epoch": 0.45, "learning_rate": 1.199436792433005e-05, "loss": 1.1436, "step": 16588 }, { "epoch": 0.45, "learning_rate": 1.1993501178471903e-05, "loss": 1.1892, "step": 16589 }, { "epoch": 0.45, "learning_rate": 1.1992634417017543e-05, "loss": 1.4258, "step": 16590 }, { "epoch": 0.45, "learning_rate": 1.1991767639973748e-05, "loss": 1.4575, "step": 16591 }, { "epoch": 0.45, "learning_rate": 1.19909008473473e-05, "loss": 1.3704, "step": 16592 }, { "epoch": 0.45, "learning_rate": 1.1990034039144977e-05, "loss": 1.4387, "step": 16593 }, { "epoch": 0.45, "learning_rate": 1.1989167215373567e-05, "loss": 1.3203, "step": 16594 }, { "epoch": 0.45, "learning_rate": 1.1988300376039847e-05, "loss": 1.1121, "step": 16595 }, { "epoch": 0.45, "learning_rate": 1.1987433521150602e-05, "loss": 1.3762, "step": 16596 }, { "epoch": 0.45, "learning_rate": 1.1986566650712608e-05, "loss": 1.3528, "step": 16597 }, { "epoch": 0.45, "learning_rate": 1.198569976473265e-05, "loss": 1.3472, "step": 16598 }, { "epoch": 0.45, "learning_rate": 1.1984832863217514e-05, "loss": 1.3933, "step": 16599 }, { "epoch": 0.45, "learning_rate": 1.1983965946173976e-05, "loss": 1.2754, "step": 16600 }, { "epoch": 0.45, "learning_rate": 1.1983099013608825e-05, "loss": 1.2422, "step": 16601 }, { "epoch": 0.45, "learning_rate": 1.1982232065528838e-05, "loss": 1.3706, "step": 16602 }, { "epoch": 0.45, "learning_rate": 1.19813651019408e-05, "loss": 1.332, "step": 16603 }, { "epoch": 0.45, "learning_rate": 1.1980498122851491e-05, "loss": 1.1919, "step": 16604 }, { "epoch": 0.45, "learning_rate": 1.1979631128267696e-05, "loss": 1.3247, "step": 16605 }, { "epoch": 0.45, "learning_rate": 1.1978764118196202e-05, "loss": 1.2124, "step": 16606 }, { "epoch": 0.45, "learning_rate": 1.1977897092643784e-05, "loss": 1.1677, "step": 16607 }, { "epoch": 0.45, "learning_rate": 1.1977030051617232e-05, "loss": 1.3865, "step": 16608 }, { "epoch": 0.45, "learning_rate": 1.1976162995123324e-05, "loss": 1.3496, "step": 16609 }, { "epoch": 0.45, "learning_rate": 1.1975295923168848e-05, "loss": 1.1887, "step": 16610 }, { "epoch": 0.45, "learning_rate": 1.1974428835760584e-05, "loss": 1.335, "step": 16611 }, { "epoch": 0.45, "learning_rate": 1.1973561732905319e-05, "loss": 1.2798, "step": 16612 }, { "epoch": 0.45, "learning_rate": 1.1972694614609834e-05, "loss": 1.3389, "step": 16613 }, { "epoch": 0.45, "learning_rate": 1.1971827480880916e-05, "loss": 1.2773, "step": 16614 }, { "epoch": 0.45, "learning_rate": 1.1970960331725343e-05, "loss": 1.3979, "step": 16615 }, { "epoch": 0.45, "learning_rate": 1.1970093167149906e-05, "loss": 1.4529, "step": 16616 }, { "epoch": 0.45, "learning_rate": 1.1969225987161384e-05, "loss": 1.4065, "step": 16617 }, { "epoch": 0.45, "learning_rate": 1.1968358791766565e-05, "loss": 1.2695, "step": 16618 }, { "epoch": 0.45, "learning_rate": 1.1967491580972232e-05, "loss": 1.2881, "step": 16619 }, { "epoch": 0.45, "learning_rate": 1.1966624354785172e-05, "loss": 1.2747, "step": 16620 }, { "epoch": 0.45, "learning_rate": 1.1965757113212166e-05, "loss": 1.2888, "step": 16621 }, { "epoch": 0.45, "learning_rate": 1.1964889856260002e-05, "loss": 1.4102, "step": 16622 }, { "epoch": 0.45, "learning_rate": 1.1964022583935462e-05, "loss": 1.4011, "step": 16623 }, { "epoch": 0.45, "learning_rate": 1.1963155296245336e-05, "loss": 1.3062, "step": 16624 }, { "epoch": 0.45, "learning_rate": 1.1962287993196404e-05, "loss": 1.2249, "step": 16625 }, { "epoch": 0.45, "learning_rate": 1.1961420674795453e-05, "loss": 1.4358, "step": 16626 }, { "epoch": 0.45, "learning_rate": 1.196055334104927e-05, "loss": 1.364, "step": 16627 }, { "epoch": 0.45, "learning_rate": 1.195968599196464e-05, "loss": 1.2202, "step": 16628 }, { "epoch": 0.45, "learning_rate": 1.1958818627548348e-05, "loss": 1.168, "step": 16629 }, { "epoch": 0.45, "learning_rate": 1.195795124780718e-05, "loss": 1.2957, "step": 16630 }, { "epoch": 0.45, "learning_rate": 1.1957083852747919e-05, "loss": 1.3989, "step": 16631 }, { "epoch": 0.45, "learning_rate": 1.195621644237736e-05, "loss": 1.283, "step": 16632 }, { "epoch": 0.45, "learning_rate": 1.1955349016702278e-05, "loss": 1.2649, "step": 16633 }, { "epoch": 0.45, "learning_rate": 1.1954481575729467e-05, "loss": 1.6655, "step": 16634 }, { "epoch": 0.45, "learning_rate": 1.195361411946571e-05, "loss": 1.2507, "step": 16635 }, { "epoch": 0.45, "learning_rate": 1.19527466479178e-05, "loss": 1.4341, "step": 16636 }, { "epoch": 0.45, "learning_rate": 1.1951879161092513e-05, "loss": 1.3491, "step": 16637 }, { "epoch": 0.45, "learning_rate": 1.1951011658996644e-05, "loss": 1.4424, "step": 16638 }, { "epoch": 0.45, "learning_rate": 1.1950144141636975e-05, "loss": 1.2852, "step": 16639 }, { "epoch": 0.45, "learning_rate": 1.1949276609020298e-05, "loss": 1.3555, "step": 16640 }, { "epoch": 0.45, "learning_rate": 1.1948409061153394e-05, "loss": 1.1135, "step": 16641 }, { "epoch": 0.45, "learning_rate": 1.1947541498043056e-05, "loss": 1.2585, "step": 16642 }, { "epoch": 0.45, "learning_rate": 1.1946673919696068e-05, "loss": 1.157, "step": 16643 }, { "epoch": 0.45, "learning_rate": 1.1945806326119221e-05, "loss": 1.3271, "step": 16644 }, { "epoch": 0.45, "learning_rate": 1.1944938717319296e-05, "loss": 1.2466, "step": 16645 }, { "epoch": 0.45, "learning_rate": 1.1944071093303088e-05, "loss": 1.2671, "step": 16646 }, { "epoch": 0.45, "learning_rate": 1.1943203454077383e-05, "loss": 1.3403, "step": 16647 }, { "epoch": 0.45, "learning_rate": 1.1942335799648965e-05, "loss": 1.3145, "step": 16648 }, { "epoch": 0.45, "learning_rate": 1.1941468130024628e-05, "loss": 1.2859, "step": 16649 }, { "epoch": 0.45, "learning_rate": 1.1940600445211155e-05, "loss": 1.3638, "step": 16650 }, { "epoch": 0.45, "learning_rate": 1.1939732745215338e-05, "loss": 1.2524, "step": 16651 }, { "epoch": 0.45, "learning_rate": 1.1938865030043962e-05, "loss": 1.1233, "step": 16652 }, { "epoch": 0.45, "learning_rate": 1.1937997299703821e-05, "loss": 1.3413, "step": 16653 }, { "epoch": 0.45, "learning_rate": 1.1937129554201698e-05, "loss": 1.4146, "step": 16654 }, { "epoch": 0.45, "learning_rate": 1.1936261793544387e-05, "loss": 1.2766, "step": 16655 }, { "epoch": 0.45, "learning_rate": 1.193539401773867e-05, "loss": 1.1255, "step": 16656 }, { "epoch": 0.45, "learning_rate": 1.1934526226791345e-05, "loss": 1.2654, "step": 16657 }, { "epoch": 0.45, "learning_rate": 1.1933658420709194e-05, "loss": 1.2822, "step": 16658 }, { "epoch": 0.45, "learning_rate": 1.193279059949901e-05, "loss": 1.2461, "step": 16659 }, { "epoch": 0.45, "learning_rate": 1.1931922763167578e-05, "loss": 1.2761, "step": 16660 }, { "epoch": 0.46, "learning_rate": 1.1931054911721693e-05, "loss": 1.3359, "step": 16661 }, { "epoch": 0.46, "learning_rate": 1.1930187045168143e-05, "loss": 1.3342, "step": 16662 }, { "epoch": 0.46, "learning_rate": 1.1929319163513717e-05, "loss": 1.3508, "step": 16663 }, { "epoch": 0.46, "learning_rate": 1.1928451266765202e-05, "loss": 1.3882, "step": 16664 }, { "epoch": 0.46, "learning_rate": 1.1927583354929393e-05, "loss": 1.4087, "step": 16665 }, { "epoch": 0.46, "learning_rate": 1.1926715428013078e-05, "loss": 1.3003, "step": 16666 }, { "epoch": 0.46, "learning_rate": 1.192584748602305e-05, "loss": 1.2776, "step": 16667 }, { "epoch": 0.46, "learning_rate": 1.1924979528966095e-05, "loss": 1.1697, "step": 16668 }, { "epoch": 0.46, "learning_rate": 1.1924111556849006e-05, "loss": 1.3538, "step": 16669 }, { "epoch": 0.46, "learning_rate": 1.1923243569678574e-05, "loss": 1.2664, "step": 16670 }, { "epoch": 0.46, "learning_rate": 1.1922375567461586e-05, "loss": 1.1401, "step": 16671 }, { "epoch": 0.46, "learning_rate": 1.1921507550204837e-05, "loss": 1.3333, "step": 16672 }, { "epoch": 0.46, "learning_rate": 1.1920639517915117e-05, "loss": 1.2651, "step": 16673 }, { "epoch": 0.46, "learning_rate": 1.1919771470599215e-05, "loss": 1.1853, "step": 16674 }, { "epoch": 0.46, "learning_rate": 1.1918903408263924e-05, "loss": 1.2354, "step": 16675 }, { "epoch": 0.46, "learning_rate": 1.1918035330916036e-05, "loss": 1.1558, "step": 16676 }, { "epoch": 0.46, "learning_rate": 1.1917167238562342e-05, "loss": 1.3699, "step": 16677 }, { "epoch": 0.46, "learning_rate": 1.1916299131209632e-05, "loss": 1.687, "step": 16678 }, { "epoch": 0.46, "learning_rate": 1.1915431008864697e-05, "loss": 1.2661, "step": 16679 }, { "epoch": 0.46, "learning_rate": 1.1914562871534331e-05, "loss": 1.2461, "step": 16680 }, { "epoch": 0.46, "learning_rate": 1.1913694719225328e-05, "loss": 1.4509, "step": 16681 }, { "epoch": 0.46, "learning_rate": 1.1912826551944476e-05, "loss": 1.3831, "step": 16682 }, { "epoch": 0.46, "learning_rate": 1.1911958369698569e-05, "loss": 1.4248, "step": 16683 }, { "epoch": 0.46, "learning_rate": 1.1911090172494397e-05, "loss": 1.3367, "step": 16684 }, { "epoch": 0.46, "learning_rate": 1.1910221960338756e-05, "loss": 1.3152, "step": 16685 }, { "epoch": 0.46, "learning_rate": 1.1909353733238436e-05, "loss": 1.1902, "step": 16686 }, { "epoch": 0.46, "learning_rate": 1.1908485491200232e-05, "loss": 1.2064, "step": 16687 }, { "epoch": 0.46, "learning_rate": 1.1907617234230933e-05, "loss": 1.179, "step": 16688 }, { "epoch": 0.46, "learning_rate": 1.1906748962337335e-05, "loss": 1.3716, "step": 16689 }, { "epoch": 0.46, "learning_rate": 1.1905880675526229e-05, "loss": 1.4104, "step": 16690 }, { "epoch": 0.46, "learning_rate": 1.190501237380441e-05, "loss": 1.3108, "step": 16691 }, { "epoch": 0.46, "learning_rate": 1.1904144057178666e-05, "loss": 1.1768, "step": 16692 }, { "epoch": 0.46, "learning_rate": 1.1903275725655799e-05, "loss": 1.3779, "step": 16693 }, { "epoch": 0.46, "learning_rate": 1.1902407379242596e-05, "loss": 1.3582, "step": 16694 }, { "epoch": 0.46, "learning_rate": 1.190153901794585e-05, "loss": 1.3555, "step": 16695 }, { "epoch": 0.46, "learning_rate": 1.190067064177236e-05, "loss": 1.3022, "step": 16696 }, { "epoch": 0.46, "learning_rate": 1.1899802250728913e-05, "loss": 1.1612, "step": 16697 }, { "epoch": 0.46, "learning_rate": 1.189893384482231e-05, "loss": 1.301, "step": 16698 }, { "epoch": 0.46, "learning_rate": 1.1898065424059342e-05, "loss": 1.1624, "step": 16699 }, { "epoch": 0.46, "learning_rate": 1.1897196988446801e-05, "loss": 1.2754, "step": 16700 }, { "epoch": 0.46, "learning_rate": 1.1896328537991484e-05, "loss": 1.2249, "step": 16701 }, { "epoch": 0.46, "learning_rate": 1.1895460072700184e-05, "loss": 1.4175, "step": 16702 }, { "epoch": 0.46, "learning_rate": 1.1894591592579695e-05, "loss": 1.2258, "step": 16703 }, { "epoch": 0.46, "learning_rate": 1.189372309763681e-05, "loss": 1.2412, "step": 16704 }, { "epoch": 0.46, "learning_rate": 1.1892854587878328e-05, "loss": 1.1055, "step": 16705 }, { "epoch": 0.46, "learning_rate": 1.1891986063311045e-05, "loss": 1.4058, "step": 16706 }, { "epoch": 0.46, "learning_rate": 1.1891117523941749e-05, "loss": 1.2415, "step": 16707 }, { "epoch": 0.46, "learning_rate": 1.189024896977724e-05, "loss": 1.3699, "step": 16708 }, { "epoch": 0.46, "learning_rate": 1.188938040082431e-05, "loss": 1.312, "step": 16709 }, { "epoch": 0.46, "learning_rate": 1.1888511817089756e-05, "loss": 1.2957, "step": 16710 }, { "epoch": 0.46, "learning_rate": 1.1887643218580376e-05, "loss": 1.3796, "step": 16711 }, { "epoch": 0.46, "learning_rate": 1.1886774605302965e-05, "loss": 1.3135, "step": 16712 }, { "epoch": 0.46, "learning_rate": 1.1885905977264312e-05, "loss": 1.3413, "step": 16713 }, { "epoch": 0.46, "learning_rate": 1.188503733447122e-05, "loss": 1.3633, "step": 16714 }, { "epoch": 0.46, "learning_rate": 1.1884168676930481e-05, "loss": 1.333, "step": 16715 }, { "epoch": 0.46, "learning_rate": 1.1883300004648895e-05, "loss": 1.1637, "step": 16716 }, { "epoch": 0.46, "learning_rate": 1.1882431317633252e-05, "loss": 1.0693, "step": 16717 }, { "epoch": 0.46, "learning_rate": 1.1881562615890354e-05, "loss": 1.4385, "step": 16718 }, { "epoch": 0.46, "learning_rate": 1.1880693899426992e-05, "loss": 1.3042, "step": 16719 }, { "epoch": 0.46, "learning_rate": 1.187982516824997e-05, "loss": 1.3621, "step": 16720 }, { "epoch": 0.46, "learning_rate": 1.1878956422366075e-05, "loss": 1.3511, "step": 16721 }, { "epoch": 0.46, "learning_rate": 1.1878087661782112e-05, "loss": 1.3579, "step": 16722 }, { "epoch": 0.46, "learning_rate": 1.187721888650487e-05, "loss": 1.4221, "step": 16723 }, { "epoch": 0.46, "learning_rate": 1.1876350096541156e-05, "loss": 1.4072, "step": 16724 }, { "epoch": 0.46, "learning_rate": 1.1875481291897757e-05, "loss": 1.3914, "step": 16725 }, { "epoch": 0.46, "learning_rate": 1.1874612472581475e-05, "loss": 1.3049, "step": 16726 }, { "epoch": 0.46, "learning_rate": 1.1873743638599105e-05, "loss": 1.2075, "step": 16727 }, { "epoch": 0.46, "learning_rate": 1.187287478995745e-05, "loss": 1.343, "step": 16728 }, { "epoch": 0.46, "learning_rate": 1.1872005926663298e-05, "loss": 1.2632, "step": 16729 }, { "epoch": 0.46, "learning_rate": 1.1871137048723458e-05, "loss": 1.4272, "step": 16730 }, { "epoch": 0.46, "learning_rate": 1.1870268156144718e-05, "loss": 1.2485, "step": 16731 }, { "epoch": 0.46, "learning_rate": 1.186939924893388e-05, "loss": 1.2554, "step": 16732 }, { "epoch": 0.46, "learning_rate": 1.186853032709774e-05, "loss": 1.2051, "step": 16733 }, { "epoch": 0.46, "learning_rate": 1.18676613906431e-05, "loss": 1.2869, "step": 16734 }, { "epoch": 0.46, "learning_rate": 1.1866792439576753e-05, "loss": 1.373, "step": 16735 }, { "epoch": 0.46, "learning_rate": 1.1865923473905504e-05, "loss": 1.363, "step": 16736 }, { "epoch": 0.46, "learning_rate": 1.1865054493636141e-05, "loss": 1.2151, "step": 16737 }, { "epoch": 0.46, "learning_rate": 1.1864185498775473e-05, "loss": 1.3303, "step": 16738 }, { "epoch": 0.46, "learning_rate": 1.1863316489330292e-05, "loss": 1.3838, "step": 16739 }, { "epoch": 0.46, "learning_rate": 1.1862447465307402e-05, "loss": 1.248, "step": 16740 }, { "epoch": 0.46, "learning_rate": 1.1861578426713596e-05, "loss": 1.3013, "step": 16741 }, { "epoch": 0.46, "learning_rate": 1.1860709373555676e-05, "loss": 1.2942, "step": 16742 }, { "epoch": 0.46, "learning_rate": 1.1859840305840442e-05, "loss": 1.1731, "step": 16743 }, { "epoch": 0.46, "learning_rate": 1.185897122357469e-05, "loss": 1.3052, "step": 16744 }, { "epoch": 0.46, "learning_rate": 1.1858102126765226e-05, "loss": 1.6167, "step": 16745 }, { "epoch": 0.46, "learning_rate": 1.1857233015418838e-05, "loss": 1.3269, "step": 16746 }, { "epoch": 0.46, "learning_rate": 1.1856363889542337e-05, "loss": 1.2471, "step": 16747 }, { "epoch": 0.46, "learning_rate": 1.1855494749142517e-05, "loss": 1.375, "step": 16748 }, { "epoch": 0.46, "learning_rate": 1.1854625594226178e-05, "loss": 1.4573, "step": 16749 }, { "epoch": 0.46, "learning_rate": 1.185375642480012e-05, "loss": 1.3337, "step": 16750 }, { "epoch": 0.46, "learning_rate": 1.1852887240871145e-05, "loss": 1.1975, "step": 16751 }, { "epoch": 0.46, "learning_rate": 1.185201804244605e-05, "loss": 1.3086, "step": 16752 }, { "epoch": 0.46, "learning_rate": 1.1851148829531638e-05, "loss": 1.1167, "step": 16753 }, { "epoch": 0.46, "learning_rate": 1.1850279602134707e-05, "loss": 1.2979, "step": 16754 }, { "epoch": 0.46, "learning_rate": 1.1849410360262058e-05, "loss": 1.4131, "step": 16755 }, { "epoch": 0.46, "learning_rate": 1.1848541103920494e-05, "loss": 1.3098, "step": 16756 }, { "epoch": 0.46, "learning_rate": 1.1847671833116812e-05, "loss": 1.2339, "step": 16757 }, { "epoch": 0.46, "learning_rate": 1.1846802547857814e-05, "loss": 1.2358, "step": 16758 }, { "epoch": 0.46, "learning_rate": 1.1845933248150302e-05, "loss": 1.0328, "step": 16759 }, { "epoch": 0.46, "learning_rate": 1.1845063934001076e-05, "loss": 1.3083, "step": 16760 }, { "epoch": 0.46, "learning_rate": 1.1844194605416939e-05, "loss": 1.3628, "step": 16761 }, { "epoch": 0.46, "learning_rate": 1.1843325262404689e-05, "loss": 1.2886, "step": 16762 }, { "epoch": 0.46, "learning_rate": 1.1842455904971132e-05, "loss": 1.1975, "step": 16763 }, { "epoch": 0.46, "learning_rate": 1.1841586533123062e-05, "loss": 1.3735, "step": 16764 }, { "epoch": 0.46, "learning_rate": 1.1840717146867286e-05, "loss": 1.3843, "step": 16765 }, { "epoch": 0.46, "learning_rate": 1.1839847746210604e-05, "loss": 1.27, "step": 16766 }, { "epoch": 0.46, "learning_rate": 1.183897833115982e-05, "loss": 1.3677, "step": 16767 }, { "epoch": 0.46, "learning_rate": 1.1838108901721734e-05, "loss": 1.3037, "step": 16768 }, { "epoch": 0.46, "learning_rate": 1.1837239457903149e-05, "loss": 1.4248, "step": 16769 }, { "epoch": 0.46, "learning_rate": 1.1836369999710866e-05, "loss": 1.1654, "step": 16770 }, { "epoch": 0.46, "learning_rate": 1.1835500527151689e-05, "loss": 1.1665, "step": 16771 }, { "epoch": 0.46, "learning_rate": 1.1834631040232413e-05, "loss": 1.3115, "step": 16772 }, { "epoch": 0.46, "learning_rate": 1.1833761538959851e-05, "loss": 1.3228, "step": 16773 }, { "epoch": 0.46, "learning_rate": 1.18328920233408e-05, "loss": 1.3013, "step": 16774 }, { "epoch": 0.46, "learning_rate": 1.1832022493382067e-05, "loss": 1.3948, "step": 16775 }, { "epoch": 0.46, "learning_rate": 1.1831152949090448e-05, "loss": 1.3154, "step": 16776 }, { "epoch": 0.46, "learning_rate": 1.183028339047275e-05, "loss": 1.2366, "step": 16777 }, { "epoch": 0.46, "learning_rate": 1.1829413817535775e-05, "loss": 1.1052, "step": 16778 }, { "epoch": 0.46, "learning_rate": 1.182854423028633e-05, "loss": 1.3237, "step": 16779 }, { "epoch": 0.46, "learning_rate": 1.1827674628731209e-05, "loss": 1.3757, "step": 16780 }, { "epoch": 0.46, "learning_rate": 1.1826805012877227e-05, "loss": 1.2305, "step": 16781 }, { "epoch": 0.46, "learning_rate": 1.1825935382731177e-05, "loss": 1.4185, "step": 16782 }, { "epoch": 0.46, "learning_rate": 1.182506573829987e-05, "loss": 1.3977, "step": 16783 }, { "epoch": 0.46, "learning_rate": 1.1824196079590104e-05, "loss": 1.3008, "step": 16784 }, { "epoch": 0.46, "learning_rate": 1.182332640660869e-05, "loss": 1.3547, "step": 16785 }, { "epoch": 0.46, "learning_rate": 1.1822456719362423e-05, "loss": 1.3572, "step": 16786 }, { "epoch": 0.46, "learning_rate": 1.1821587017858116e-05, "loss": 1.3289, "step": 16787 }, { "epoch": 0.46, "learning_rate": 1.1820717302102564e-05, "loss": 1.343, "step": 16788 }, { "epoch": 0.46, "learning_rate": 1.1819847572102578e-05, "loss": 1.7144, "step": 16789 }, { "epoch": 0.46, "learning_rate": 1.1818977827864961e-05, "loss": 1.3906, "step": 16790 }, { "epoch": 0.46, "learning_rate": 1.1818108069396516e-05, "loss": 1.2893, "step": 16791 }, { "epoch": 0.46, "learning_rate": 1.181723829670405e-05, "loss": 1.3809, "step": 16792 }, { "epoch": 0.46, "learning_rate": 1.1816368509794365e-05, "loss": 1.1873, "step": 16793 }, { "epoch": 0.46, "learning_rate": 1.1815498708674266e-05, "loss": 1.228, "step": 16794 }, { "epoch": 0.46, "learning_rate": 1.181462889335056e-05, "loss": 1.3398, "step": 16795 }, { "epoch": 0.46, "learning_rate": 1.1813759063830053e-05, "loss": 1.2693, "step": 16796 }, { "epoch": 0.46, "learning_rate": 1.1812889220119546e-05, "loss": 1.3665, "step": 16797 }, { "epoch": 0.46, "learning_rate": 1.1812019362225844e-05, "loss": 1.8301, "step": 16798 }, { "epoch": 0.46, "learning_rate": 1.1811149490155758e-05, "loss": 1.2366, "step": 16799 }, { "epoch": 0.46, "learning_rate": 1.1810279603916089e-05, "loss": 1.3938, "step": 16800 }, { "epoch": 0.46, "learning_rate": 1.1809409703513643e-05, "loss": 1.2288, "step": 16801 }, { "epoch": 0.46, "learning_rate": 1.1808539788955224e-05, "loss": 1.3291, "step": 16802 }, { "epoch": 0.46, "learning_rate": 1.1807669860247643e-05, "loss": 1.0671, "step": 16803 }, { "epoch": 0.46, "learning_rate": 1.1806799917397705e-05, "loss": 1.4019, "step": 16804 }, { "epoch": 0.46, "learning_rate": 1.1805929960412208e-05, "loss": 1.4121, "step": 16805 }, { "epoch": 0.46, "learning_rate": 1.180505998929797e-05, "loss": 1.2263, "step": 16806 }, { "epoch": 0.46, "learning_rate": 1.1804190004061788e-05, "loss": 1.3501, "step": 16807 }, { "epoch": 0.46, "learning_rate": 1.1803320004710475e-05, "loss": 1.2566, "step": 16808 }, { "epoch": 0.46, "learning_rate": 1.180244999125083e-05, "loss": 1.3882, "step": 16809 }, { "epoch": 0.46, "learning_rate": 1.1801579963689669e-05, "loss": 1.0339, "step": 16810 }, { "epoch": 0.46, "learning_rate": 1.1800709922033788e-05, "loss": 1.4709, "step": 16811 }, { "epoch": 0.46, "learning_rate": 1.1799839866290004e-05, "loss": 1.2688, "step": 16812 }, { "epoch": 0.46, "learning_rate": 1.1798969796465116e-05, "loss": 1.3218, "step": 16813 }, { "epoch": 0.46, "learning_rate": 1.1798099712565939e-05, "loss": 1.4561, "step": 16814 }, { "epoch": 0.46, "learning_rate": 1.1797229614599269e-05, "loss": 1.4492, "step": 16815 }, { "epoch": 0.46, "learning_rate": 1.1796359502571924e-05, "loss": 1.2314, "step": 16816 }, { "epoch": 0.46, "learning_rate": 1.1795489376490706e-05, "loss": 1.3347, "step": 16817 }, { "epoch": 0.46, "learning_rate": 1.179461923636242e-05, "loss": 1.3562, "step": 16818 }, { "epoch": 0.46, "learning_rate": 1.179374908219388e-05, "loss": 1.3435, "step": 16819 }, { "epoch": 0.46, "learning_rate": 1.1792878913991893e-05, "loss": 1.3223, "step": 16820 }, { "epoch": 0.46, "learning_rate": 1.1792008731763258e-05, "loss": 1.3762, "step": 16821 }, { "epoch": 0.46, "learning_rate": 1.1791138535514794e-05, "loss": 1.1921, "step": 16822 }, { "epoch": 0.46, "learning_rate": 1.1790268325253305e-05, "loss": 1.1643, "step": 16823 }, { "epoch": 0.46, "learning_rate": 1.1789398100985596e-05, "loss": 1.1296, "step": 16824 }, { "epoch": 0.46, "learning_rate": 1.1788527862718479e-05, "loss": 1.2778, "step": 16825 }, { "epoch": 0.46, "learning_rate": 1.1787657610458762e-05, "loss": 1.2144, "step": 16826 }, { "epoch": 0.46, "learning_rate": 1.1786787344213251e-05, "loss": 1.334, "step": 16827 }, { "epoch": 0.46, "learning_rate": 1.1785917063988757e-05, "loss": 1.3516, "step": 16828 }, { "epoch": 0.46, "learning_rate": 1.1785046769792086e-05, "loss": 1.2454, "step": 16829 }, { "epoch": 0.46, "learning_rate": 1.178417646163005e-05, "loss": 1.355, "step": 16830 }, { "epoch": 0.46, "learning_rate": 1.1783306139509456e-05, "loss": 1.4058, "step": 16831 }, { "epoch": 0.46, "learning_rate": 1.1782435803437113e-05, "loss": 1.3792, "step": 16832 }, { "epoch": 0.46, "learning_rate": 1.178156545341983e-05, "loss": 1.2239, "step": 16833 }, { "epoch": 0.46, "learning_rate": 1.1780695089464418e-05, "loss": 1.2251, "step": 16834 }, { "epoch": 0.46, "learning_rate": 1.177982471157768e-05, "loss": 1.2429, "step": 16835 }, { "epoch": 0.46, "learning_rate": 1.1778954319766438e-05, "loss": 1.4485, "step": 16836 }, { "epoch": 0.46, "learning_rate": 1.177808391403749e-05, "loss": 1.2634, "step": 16837 }, { "epoch": 0.46, "learning_rate": 1.177721349439765e-05, "loss": 1.3154, "step": 16838 }, { "epoch": 0.46, "learning_rate": 1.1776343060853727e-05, "loss": 1.4155, "step": 16839 }, { "epoch": 0.46, "learning_rate": 1.1775472613412534e-05, "loss": 1.3567, "step": 16840 }, { "epoch": 0.46, "learning_rate": 1.1774602152080874e-05, "loss": 1.1187, "step": 16841 }, { "epoch": 0.46, "learning_rate": 1.1773731676865565e-05, "loss": 1.7188, "step": 16842 }, { "epoch": 0.46, "learning_rate": 1.177286118777341e-05, "loss": 1.335, "step": 16843 }, { "epoch": 0.46, "learning_rate": 1.1771990684811226e-05, "loss": 1.3391, "step": 16844 }, { "epoch": 0.46, "learning_rate": 1.1771120167985817e-05, "loss": 1.4014, "step": 16845 }, { "epoch": 0.46, "learning_rate": 1.1770249637303998e-05, "loss": 1.147, "step": 16846 }, { "epoch": 0.46, "learning_rate": 1.1769379092772577e-05, "loss": 1.1726, "step": 16847 }, { "epoch": 0.46, "learning_rate": 1.1768508534398368e-05, "loss": 1.3396, "step": 16848 }, { "epoch": 0.46, "learning_rate": 1.176763796218818e-05, "loss": 1.2664, "step": 16849 }, { "epoch": 0.46, "learning_rate": 1.176676737614882e-05, "loss": 1.2358, "step": 16850 }, { "epoch": 0.46, "learning_rate": 1.1765896776287107e-05, "loss": 1.4102, "step": 16851 }, { "epoch": 0.46, "learning_rate": 1.1765026162609847e-05, "loss": 1.3755, "step": 16852 }, { "epoch": 0.46, "learning_rate": 1.1764155535123854e-05, "loss": 1.2854, "step": 16853 }, { "epoch": 0.46, "learning_rate": 1.1763284893835933e-05, "loss": 1.4004, "step": 16854 }, { "epoch": 0.46, "learning_rate": 1.1762414238752903e-05, "loss": 1.4062, "step": 16855 }, { "epoch": 0.46, "learning_rate": 1.1761543569881573e-05, "loss": 1.3545, "step": 16856 }, { "epoch": 0.46, "learning_rate": 1.1760672887228754e-05, "loss": 1.3799, "step": 16857 }, { "epoch": 0.46, "learning_rate": 1.1759802190801257e-05, "loss": 1.2671, "step": 16858 }, { "epoch": 0.46, "learning_rate": 1.17589314806059e-05, "loss": 1.3069, "step": 16859 }, { "epoch": 0.46, "learning_rate": 1.1758060756649482e-05, "loss": 1.3564, "step": 16860 }, { "epoch": 0.46, "learning_rate": 1.1757190018938829e-05, "loss": 1.093, "step": 16861 }, { "epoch": 0.46, "learning_rate": 1.1756319267480746e-05, "loss": 1.4497, "step": 16862 }, { "epoch": 0.46, "learning_rate": 1.1755448502282048e-05, "loss": 1.2363, "step": 16863 }, { "epoch": 0.46, "learning_rate": 1.1754577723349547e-05, "loss": 1.4241, "step": 16864 }, { "epoch": 0.46, "learning_rate": 1.1753706930690052e-05, "loss": 1.2588, "step": 16865 }, { "epoch": 0.46, "learning_rate": 1.1752836124310381e-05, "loss": 1.2239, "step": 16866 }, { "epoch": 0.46, "learning_rate": 1.1751965304217343e-05, "loss": 1.2612, "step": 16867 }, { "epoch": 0.46, "learning_rate": 1.1751094470417754e-05, "loss": 1.3845, "step": 16868 }, { "epoch": 0.46, "learning_rate": 1.1750223622918424e-05, "loss": 1.2615, "step": 16869 }, { "epoch": 0.46, "learning_rate": 1.1749352761726167e-05, "loss": 1.2009, "step": 16870 }, { "epoch": 0.46, "learning_rate": 1.17484818868478e-05, "loss": 1.3513, "step": 16871 }, { "epoch": 0.46, "learning_rate": 1.174761099829013e-05, "loss": 1.0974, "step": 16872 }, { "epoch": 0.46, "learning_rate": 1.1746740096059974e-05, "loss": 1.3425, "step": 16873 }, { "epoch": 0.46, "learning_rate": 1.1745869180164142e-05, "loss": 1.4077, "step": 16874 }, { "epoch": 0.46, "learning_rate": 1.1744998250609454e-05, "loss": 1.2659, "step": 16875 }, { "epoch": 0.46, "learning_rate": 1.174412730740272e-05, "loss": 1.427, "step": 16876 }, { "epoch": 0.46, "learning_rate": 1.1743256350550753e-05, "loss": 1.3303, "step": 16877 }, { "epoch": 0.46, "learning_rate": 1.1742385380060368e-05, "loss": 1.3213, "step": 16878 }, { "epoch": 0.46, "learning_rate": 1.1741514395938381e-05, "loss": 1.2722, "step": 16879 }, { "epoch": 0.46, "learning_rate": 1.1740643398191603e-05, "loss": 1.3121, "step": 16880 }, { "epoch": 0.46, "learning_rate": 1.1739772386826846e-05, "loss": 1.3474, "step": 16881 }, { "epoch": 0.46, "learning_rate": 1.1738901361850932e-05, "loss": 1.2896, "step": 16882 }, { "epoch": 0.46, "learning_rate": 1.173803032327067e-05, "loss": 1.2622, "step": 16883 }, { "epoch": 0.46, "learning_rate": 1.1737159271092877e-05, "loss": 1.4026, "step": 16884 }, { "epoch": 0.46, "learning_rate": 1.1736288205324366e-05, "loss": 1.4146, "step": 16885 }, { "epoch": 0.46, "learning_rate": 1.1735417125971952e-05, "loss": 1.4668, "step": 16886 }, { "epoch": 0.46, "learning_rate": 1.1734546033042454e-05, "loss": 1.333, "step": 16887 }, { "epoch": 0.46, "learning_rate": 1.173367492654268e-05, "loss": 1.3379, "step": 16888 }, { "epoch": 0.46, "learning_rate": 1.1732803806479451e-05, "loss": 1.3752, "step": 16889 }, { "epoch": 0.46, "learning_rate": 1.1731932672859578e-05, "loss": 1.3784, "step": 16890 }, { "epoch": 0.46, "learning_rate": 1.1731061525689879e-05, "loss": 1.2803, "step": 16891 }, { "epoch": 0.46, "learning_rate": 1.1730190364977167e-05, "loss": 1.3337, "step": 16892 }, { "epoch": 0.46, "learning_rate": 1.172931919072826e-05, "loss": 1.408, "step": 16893 }, { "epoch": 0.46, "learning_rate": 1.1728448002949974e-05, "loss": 1.2297, "step": 16894 }, { "epoch": 0.46, "learning_rate": 1.1727576801649124e-05, "loss": 1.3494, "step": 16895 }, { "epoch": 0.46, "learning_rate": 1.1726705586832521e-05, "loss": 1.2458, "step": 16896 }, { "epoch": 0.46, "learning_rate": 1.1725834358506988e-05, "loss": 1.3569, "step": 16897 }, { "epoch": 0.46, "learning_rate": 1.172496311667934e-05, "loss": 1.3877, "step": 16898 }, { "epoch": 0.46, "learning_rate": 1.1724091861356392e-05, "loss": 1.1614, "step": 16899 }, { "epoch": 0.46, "learning_rate": 1.1723220592544959e-05, "loss": 1.3208, "step": 16900 }, { "epoch": 0.46, "learning_rate": 1.172234931025186e-05, "loss": 1.2913, "step": 16901 }, { "epoch": 0.46, "learning_rate": 1.1721478014483907e-05, "loss": 1.2676, "step": 16902 }, { "epoch": 0.46, "learning_rate": 1.1720606705247922e-05, "loss": 1.6987, "step": 16903 }, { "epoch": 0.46, "learning_rate": 1.1719735382550716e-05, "loss": 1.2473, "step": 16904 }, { "epoch": 0.46, "learning_rate": 1.1718864046399112e-05, "loss": 1.3374, "step": 16905 }, { "epoch": 0.46, "learning_rate": 1.1717992696799923e-05, "loss": 1.2498, "step": 16906 }, { "epoch": 0.46, "learning_rate": 1.1717121333759966e-05, "loss": 1.3123, "step": 16907 }, { "epoch": 0.46, "learning_rate": 1.1716249957286061e-05, "loss": 1.4426, "step": 16908 }, { "epoch": 0.46, "learning_rate": 1.1715378567385023e-05, "loss": 1.217, "step": 16909 }, { "epoch": 0.46, "learning_rate": 1.1714507164063668e-05, "loss": 1.3523, "step": 16910 }, { "epoch": 0.46, "learning_rate": 1.1713635747328817e-05, "loss": 1.4653, "step": 16911 }, { "epoch": 0.46, "learning_rate": 1.1712764317187283e-05, "loss": 1.2905, "step": 16912 }, { "epoch": 0.46, "learning_rate": 1.171189287364589e-05, "loss": 1.3574, "step": 16913 }, { "epoch": 0.46, "learning_rate": 1.171102141671145e-05, "loss": 1.2566, "step": 16914 }, { "epoch": 0.46, "learning_rate": 1.1710149946390783e-05, "loss": 1.3022, "step": 16915 }, { "epoch": 0.46, "learning_rate": 1.170927846269071e-05, "loss": 1.2888, "step": 16916 }, { "epoch": 0.46, "learning_rate": 1.1708406965618042e-05, "loss": 1.2939, "step": 16917 }, { "epoch": 0.46, "learning_rate": 1.1707535455179604e-05, "loss": 1.3105, "step": 16918 }, { "epoch": 0.46, "learning_rate": 1.1706663931382209e-05, "loss": 1.3882, "step": 16919 }, { "epoch": 0.46, "learning_rate": 1.1705792394232682e-05, "loss": 1.2202, "step": 16920 }, { "epoch": 0.46, "learning_rate": 1.1704920843737833e-05, "loss": 1.2271, "step": 16921 }, { "epoch": 0.46, "learning_rate": 1.1704049279904488e-05, "loss": 1.4287, "step": 16922 }, { "epoch": 0.46, "learning_rate": 1.170317770273946e-05, "loss": 1.3, "step": 16923 }, { "epoch": 0.46, "learning_rate": 1.1702306112249575e-05, "loss": 1.3237, "step": 16924 }, { "epoch": 0.46, "learning_rate": 1.1701434508441643e-05, "loss": 1.4136, "step": 16925 }, { "epoch": 0.46, "learning_rate": 1.1700562891322491e-05, "loss": 1.4429, "step": 16926 }, { "epoch": 0.46, "learning_rate": 1.1699691260898929e-05, "loss": 1.2449, "step": 16927 }, { "epoch": 0.46, "learning_rate": 1.1698819617177786e-05, "loss": 1.2705, "step": 16928 }, { "epoch": 0.46, "learning_rate": 1.1697947960165877e-05, "loss": 1.2698, "step": 16929 }, { "epoch": 0.46, "learning_rate": 1.1697076289870022e-05, "loss": 1.1865, "step": 16930 }, { "epoch": 0.46, "learning_rate": 1.169620460629704e-05, "loss": 1.6304, "step": 16931 }, { "epoch": 0.46, "learning_rate": 1.169533290945375e-05, "loss": 1.0786, "step": 16932 }, { "epoch": 0.46, "learning_rate": 1.1694461199346971e-05, "loss": 1.0642, "step": 16933 }, { "epoch": 0.46, "learning_rate": 1.1693589475983527e-05, "loss": 1.3804, "step": 16934 }, { "epoch": 0.46, "learning_rate": 1.1692717739370234e-05, "loss": 1.158, "step": 16935 }, { "epoch": 0.46, "learning_rate": 1.1691845989513915e-05, "loss": 1.3633, "step": 16936 }, { "epoch": 0.46, "learning_rate": 1.1690974226421386e-05, "loss": 1.2649, "step": 16937 }, { "epoch": 0.46, "learning_rate": 1.1690102450099472e-05, "loss": 1.3386, "step": 16938 }, { "epoch": 0.46, "learning_rate": 1.1689230660554988e-05, "loss": 1.3608, "step": 16939 }, { "epoch": 0.46, "learning_rate": 1.1688358857794762e-05, "loss": 1.2847, "step": 16940 }, { "epoch": 0.46, "learning_rate": 1.1687487041825607e-05, "loss": 1.0902, "step": 16941 }, { "epoch": 0.46, "learning_rate": 1.168661521265435e-05, "loss": 1.3242, "step": 16942 }, { "epoch": 0.46, "learning_rate": 1.1685743370287803e-05, "loss": 1.4563, "step": 16943 }, { "epoch": 0.46, "learning_rate": 1.1684871514732799e-05, "loss": 1.2893, "step": 16944 }, { "epoch": 0.46, "learning_rate": 1.1683999645996146e-05, "loss": 1.1541, "step": 16945 }, { "epoch": 0.46, "learning_rate": 1.1683127764084678e-05, "loss": 1.2932, "step": 16946 }, { "epoch": 0.46, "learning_rate": 1.1682255869005206e-05, "loss": 1.2009, "step": 16947 }, { "epoch": 0.46, "learning_rate": 1.1681383960764559e-05, "loss": 1.2122, "step": 16948 }, { "epoch": 0.46, "learning_rate": 1.168051203936955e-05, "loss": 1.3022, "step": 16949 }, { "epoch": 0.46, "learning_rate": 1.1679640104827009e-05, "loss": 1.3192, "step": 16950 }, { "epoch": 0.46, "learning_rate": 1.167876815714375e-05, "loss": 1.2629, "step": 16951 }, { "epoch": 0.46, "learning_rate": 1.1677896196326602e-05, "loss": 1.2888, "step": 16952 }, { "epoch": 0.46, "learning_rate": 1.167702422238238e-05, "loss": 1.3567, "step": 16953 }, { "epoch": 0.46, "learning_rate": 1.167615223531791e-05, "loss": 1.3042, "step": 16954 }, { "epoch": 0.46, "learning_rate": 1.1675280235140014e-05, "loss": 1.179, "step": 16955 }, { "epoch": 0.46, "learning_rate": 1.1674408221855513e-05, "loss": 1.2974, "step": 16956 }, { "epoch": 0.46, "learning_rate": 1.1673536195471228e-05, "loss": 1.2915, "step": 16957 }, { "epoch": 0.46, "learning_rate": 1.1672664155993984e-05, "loss": 1.7251, "step": 16958 }, { "epoch": 0.46, "learning_rate": 1.16717921034306e-05, "loss": 1.1562, "step": 16959 }, { "epoch": 0.46, "learning_rate": 1.1670920037787903e-05, "loss": 1.241, "step": 16960 }, { "epoch": 0.46, "learning_rate": 1.1670047959072714e-05, "loss": 1.5366, "step": 16961 }, { "epoch": 0.46, "learning_rate": 1.1669175867291853e-05, "loss": 1.2219, "step": 16962 }, { "epoch": 0.46, "learning_rate": 1.1668303762452147e-05, "loss": 1.3098, "step": 16963 }, { "epoch": 0.46, "learning_rate": 1.1667431644560417e-05, "loss": 1.3679, "step": 16964 }, { "epoch": 0.46, "learning_rate": 1.1666559513623483e-05, "loss": 1.3269, "step": 16965 }, { "epoch": 0.46, "learning_rate": 1.1665687369648174e-05, "loss": 1.109, "step": 16966 }, { "epoch": 0.46, "learning_rate": 1.166481521264131e-05, "loss": 1.302, "step": 16967 }, { "epoch": 0.46, "learning_rate": 1.166394304260971e-05, "loss": 1.2881, "step": 16968 }, { "epoch": 0.46, "learning_rate": 1.1663070859560209e-05, "loss": 1.2844, "step": 16969 }, { "epoch": 0.46, "learning_rate": 1.166219866349962e-05, "loss": 1.3152, "step": 16970 }, { "epoch": 0.46, "learning_rate": 1.1661326454434771e-05, "loss": 1.4148, "step": 16971 }, { "epoch": 0.46, "learning_rate": 1.1660454232372485e-05, "loss": 1.3921, "step": 16972 }, { "epoch": 0.46, "learning_rate": 1.1659581997319585e-05, "loss": 1.521, "step": 16973 }, { "epoch": 0.46, "learning_rate": 1.1658709749282892e-05, "loss": 1.3784, "step": 16974 }, { "epoch": 0.46, "learning_rate": 1.1657837488269242e-05, "loss": 1.2864, "step": 16975 }, { "epoch": 0.46, "learning_rate": 1.1656965214285446e-05, "loss": 1.1565, "step": 16976 }, { "epoch": 0.46, "learning_rate": 1.1656092927338337e-05, "loss": 1.3604, "step": 16977 }, { "epoch": 0.46, "learning_rate": 1.165522062743473e-05, "loss": 1.0541, "step": 16978 }, { "epoch": 0.46, "learning_rate": 1.1654348314581461e-05, "loss": 1.2954, "step": 16979 }, { "epoch": 0.46, "learning_rate": 1.1653475988785345e-05, "loss": 1.2056, "step": 16980 }, { "epoch": 0.46, "learning_rate": 1.1652603650053212e-05, "loss": 1.1958, "step": 16981 }, { "epoch": 0.46, "learning_rate": 1.1651731298391884e-05, "loss": 1.377, "step": 16982 }, { "epoch": 0.46, "learning_rate": 1.1650858933808189e-05, "loss": 1.0952, "step": 16983 }, { "epoch": 0.46, "learning_rate": 1.1649986556308948e-05, "loss": 1.2747, "step": 16984 }, { "epoch": 0.46, "learning_rate": 1.164911416590099e-05, "loss": 1.1509, "step": 16985 }, { "epoch": 0.46, "learning_rate": 1.1648241762591135e-05, "loss": 1.3398, "step": 16986 }, { "epoch": 0.46, "learning_rate": 1.1647369346386217e-05, "loss": 1.011, "step": 16987 }, { "epoch": 0.46, "learning_rate": 1.1646496917293051e-05, "loss": 1.394, "step": 16988 }, { "epoch": 0.46, "learning_rate": 1.1645624475318469e-05, "loss": 1.3267, "step": 16989 }, { "epoch": 0.46, "learning_rate": 1.1644752020469293e-05, "loss": 1.1187, "step": 16990 }, { "epoch": 0.46, "learning_rate": 1.1643879552752352e-05, "loss": 1.3193, "step": 16991 }, { "epoch": 0.46, "learning_rate": 1.164300707217447e-05, "loss": 1.2239, "step": 16992 }, { "epoch": 0.46, "learning_rate": 1.1642134578742474e-05, "loss": 1.3003, "step": 16993 }, { "epoch": 0.46, "learning_rate": 1.1641262072463188e-05, "loss": 1.1807, "step": 16994 }, { "epoch": 0.46, "learning_rate": 1.1640389553343442e-05, "loss": 1.2017, "step": 16995 }, { "epoch": 0.46, "learning_rate": 1.163951702139006e-05, "loss": 1.2869, "step": 16996 }, { "epoch": 0.46, "learning_rate": 1.1638644476609865e-05, "loss": 1.1799, "step": 16997 }, { "epoch": 0.46, "learning_rate": 1.1637771919009687e-05, "loss": 1.2573, "step": 16998 }, { "epoch": 0.46, "learning_rate": 1.1636899348596353e-05, "loss": 1.4021, "step": 16999 }, { "epoch": 0.46, "learning_rate": 1.1636026765376685e-05, "loss": 1.3103, "step": 17000 }, { "epoch": 0.46, "learning_rate": 1.1635154169357517e-05, "loss": 1.3594, "step": 17001 }, { "epoch": 0.46, "learning_rate": 1.1634281560545669e-05, "loss": 1.155, "step": 17002 }, { "epoch": 0.46, "learning_rate": 1.1633408938947972e-05, "loss": 1.3938, "step": 17003 }, { "epoch": 0.46, "learning_rate": 1.163253630457125e-05, "loss": 1.4233, "step": 17004 }, { "epoch": 0.46, "learning_rate": 1.163166365742233e-05, "loss": 1.2546, "step": 17005 }, { "epoch": 0.46, "learning_rate": 1.1630790997508044e-05, "loss": 1.334, "step": 17006 }, { "epoch": 0.46, "learning_rate": 1.1629918324835214e-05, "loss": 1.3376, "step": 17007 }, { "epoch": 0.46, "learning_rate": 1.1629045639410672e-05, "loss": 1.261, "step": 17008 }, { "epoch": 0.46, "learning_rate": 1.162817294124124e-05, "loss": 1.4114, "step": 17009 }, { "epoch": 0.46, "learning_rate": 1.1627300230333749e-05, "loss": 1.3835, "step": 17010 }, { "epoch": 0.46, "learning_rate": 1.1626427506695028e-05, "loss": 1.1948, "step": 17011 }, { "epoch": 0.46, "learning_rate": 1.1625554770331902e-05, "loss": 1.2981, "step": 17012 }, { "epoch": 0.46, "learning_rate": 1.1624682021251201e-05, "loss": 1.2014, "step": 17013 }, { "epoch": 0.46, "learning_rate": 1.1623809259459751e-05, "loss": 1.344, "step": 17014 }, { "epoch": 0.46, "learning_rate": 1.162293648496438e-05, "loss": 1.271, "step": 17015 }, { "epoch": 0.46, "learning_rate": 1.1622063697771919e-05, "loss": 1.2117, "step": 17016 }, { "epoch": 0.46, "learning_rate": 1.1621190897889194e-05, "loss": 1.2463, "step": 17017 }, { "epoch": 0.46, "learning_rate": 1.1620318085323032e-05, "loss": 1.4492, "step": 17018 }, { "epoch": 0.46, "learning_rate": 1.1619445260080264e-05, "loss": 1.2642, "step": 17019 }, { "epoch": 0.46, "learning_rate": 1.1618572422167717e-05, "loss": 1.3208, "step": 17020 }, { "epoch": 0.46, "learning_rate": 1.1617699571592222e-05, "loss": 1.2827, "step": 17021 }, { "epoch": 0.46, "learning_rate": 1.1616826708360608e-05, "loss": 1.2463, "step": 17022 }, { "epoch": 0.46, "learning_rate": 1.1615953832479698e-05, "loss": 1.1273, "step": 17023 }, { "epoch": 0.46, "learning_rate": 1.1615080943956327e-05, "loss": 1.2754, "step": 17024 }, { "epoch": 0.46, "learning_rate": 1.1614208042797324e-05, "loss": 1.1256, "step": 17025 }, { "epoch": 0.46, "learning_rate": 1.1613335129009515e-05, "loss": 1.2041, "step": 17026 }, { "epoch": 0.46, "learning_rate": 1.1612462202599727e-05, "loss": 1.3245, "step": 17027 }, { "epoch": 0.47, "learning_rate": 1.1611589263574799e-05, "loss": 1.2207, "step": 17028 }, { "epoch": 0.47, "learning_rate": 1.1610716311941551e-05, "loss": 1.3489, "step": 17029 }, { "epoch": 0.47, "learning_rate": 1.1609843347706818e-05, "loss": 1.0657, "step": 17030 }, { "epoch": 0.47, "learning_rate": 1.1608970370877425e-05, "loss": 1.1958, "step": 17031 }, { "epoch": 0.47, "learning_rate": 1.1608097381460205e-05, "loss": 1.2947, "step": 17032 }, { "epoch": 0.47, "learning_rate": 1.1607224379461987e-05, "loss": 1.3198, "step": 17033 }, { "epoch": 0.47, "learning_rate": 1.1606351364889604e-05, "loss": 1.2825, "step": 17034 }, { "epoch": 0.47, "learning_rate": 1.160547833774988e-05, "loss": 1.3125, "step": 17035 }, { "epoch": 0.47, "learning_rate": 1.160460529804965e-05, "loss": 1.2241, "step": 17036 }, { "epoch": 0.47, "learning_rate": 1.160373224579574e-05, "loss": 1.3174, "step": 17037 }, { "epoch": 0.47, "learning_rate": 1.1602859180994988e-05, "loss": 1.7217, "step": 17038 }, { "epoch": 0.47, "learning_rate": 1.1601986103654215e-05, "loss": 1.3379, "step": 17039 }, { "epoch": 0.47, "learning_rate": 1.1601113013780259e-05, "loss": 1.3823, "step": 17040 }, { "epoch": 0.47, "learning_rate": 1.1600239911379948e-05, "loss": 1.3513, "step": 17041 }, { "epoch": 0.47, "learning_rate": 1.159936679646011e-05, "loss": 1.3379, "step": 17042 }, { "epoch": 0.47, "learning_rate": 1.159849366902758e-05, "loss": 1.3379, "step": 17043 }, { "epoch": 0.47, "learning_rate": 1.1597620529089187e-05, "loss": 1.2285, "step": 17044 }, { "epoch": 0.47, "learning_rate": 1.159674737665176e-05, "loss": 1.502, "step": 17045 }, { "epoch": 0.47, "learning_rate": 1.1595874211722135e-05, "loss": 1.3987, "step": 17046 }, { "epoch": 0.47, "learning_rate": 1.1595001034307138e-05, "loss": 1.3896, "step": 17047 }, { "epoch": 0.47, "learning_rate": 1.1594127844413608e-05, "loss": 1.2529, "step": 17048 }, { "epoch": 0.47, "learning_rate": 1.1593254642048366e-05, "loss": 1.2849, "step": 17049 }, { "epoch": 0.47, "learning_rate": 1.1592381427218254e-05, "loss": 1.1835, "step": 17050 }, { "epoch": 0.47, "learning_rate": 1.1591508199930094e-05, "loss": 1.333, "step": 17051 }, { "epoch": 0.47, "learning_rate": 1.1590634960190722e-05, "loss": 1.1113, "step": 17052 }, { "epoch": 0.47, "learning_rate": 1.158976170800697e-05, "loss": 1.1821, "step": 17053 }, { "epoch": 0.47, "learning_rate": 1.1588888443385673e-05, "loss": 1.3989, "step": 17054 }, { "epoch": 0.47, "learning_rate": 1.1588015166333656e-05, "loss": 1.1941, "step": 17055 }, { "epoch": 0.47, "learning_rate": 1.1587141876857762e-05, "loss": 1.2754, "step": 17056 }, { "epoch": 0.47, "learning_rate": 1.158626857496481e-05, "loss": 1.2839, "step": 17057 }, { "epoch": 0.47, "learning_rate": 1.158539526066164e-05, "loss": 1.1821, "step": 17058 }, { "epoch": 0.47, "learning_rate": 1.1584521933955083e-05, "loss": 1.3229, "step": 17059 }, { "epoch": 0.47, "learning_rate": 1.1583648594851976e-05, "loss": 1.23, "step": 17060 }, { "epoch": 0.47, "learning_rate": 1.1582775243359139e-05, "loss": 1.3269, "step": 17061 }, { "epoch": 0.47, "learning_rate": 1.158190187948342e-05, "loss": 1.2952, "step": 17062 }, { "epoch": 0.47, "learning_rate": 1.158102850323164e-05, "loss": 1.1091, "step": 17063 }, { "epoch": 0.47, "learning_rate": 1.1580155114610639e-05, "loss": 1.1788, "step": 17064 }, { "epoch": 0.47, "learning_rate": 1.1579281713627246e-05, "loss": 1.4348, "step": 17065 }, { "epoch": 0.47, "learning_rate": 1.1578408300288295e-05, "loss": 1.2195, "step": 17066 }, { "epoch": 0.47, "learning_rate": 1.157753487460062e-05, "loss": 1.2544, "step": 17067 }, { "epoch": 0.47, "learning_rate": 1.1576661436571053e-05, "loss": 1.3823, "step": 17068 }, { "epoch": 0.47, "learning_rate": 1.1575787986206433e-05, "loss": 1.2212, "step": 17069 }, { "epoch": 0.47, "learning_rate": 1.1574914523513583e-05, "loss": 1.2644, "step": 17070 }, { "epoch": 0.47, "learning_rate": 1.1574041048499347e-05, "loss": 1.2976, "step": 17071 }, { "epoch": 0.47, "learning_rate": 1.157316756117055e-05, "loss": 1.1042, "step": 17072 }, { "epoch": 0.47, "learning_rate": 1.1572294061534033e-05, "loss": 1.3779, "step": 17073 }, { "epoch": 0.47, "learning_rate": 1.1571420549596624e-05, "loss": 1.4119, "step": 17074 }, { "epoch": 0.47, "learning_rate": 1.1570547025365161e-05, "loss": 1.3008, "step": 17075 }, { "epoch": 0.47, "learning_rate": 1.1569673488846478e-05, "loss": 1.2056, "step": 17076 }, { "epoch": 0.47, "learning_rate": 1.1568799940047406e-05, "loss": 1.2549, "step": 17077 }, { "epoch": 0.47, "learning_rate": 1.1567926378974781e-05, "loss": 1.2271, "step": 17078 }, { "epoch": 0.47, "learning_rate": 1.1567052805635437e-05, "loss": 1.7036, "step": 17079 }, { "epoch": 0.47, "learning_rate": 1.1566179220036209e-05, "loss": 1.2949, "step": 17080 }, { "epoch": 0.47, "learning_rate": 1.1565305622183933e-05, "loss": 1.397, "step": 17081 }, { "epoch": 0.47, "learning_rate": 1.1564432012085439e-05, "loss": 1.3384, "step": 17082 }, { "epoch": 0.47, "learning_rate": 1.1563558389747564e-05, "loss": 1.2227, "step": 17083 }, { "epoch": 0.47, "learning_rate": 1.1562684755177145e-05, "loss": 1.4463, "step": 17084 }, { "epoch": 0.47, "learning_rate": 1.1561811108381017e-05, "loss": 1.2383, "step": 17085 }, { "epoch": 0.47, "learning_rate": 1.156093744936601e-05, "loss": 1.2939, "step": 17086 }, { "epoch": 0.47, "learning_rate": 1.1560063778138965e-05, "loss": 1.2144, "step": 17087 }, { "epoch": 0.47, "learning_rate": 1.1559190094706714e-05, "loss": 1.3687, "step": 17088 }, { "epoch": 0.47, "learning_rate": 1.1558316399076093e-05, "loss": 1.3877, "step": 17089 }, { "epoch": 0.47, "learning_rate": 1.1557442691253938e-05, "loss": 1.3542, "step": 17090 }, { "epoch": 0.47, "learning_rate": 1.1556568971247083e-05, "loss": 1.3403, "step": 17091 }, { "epoch": 0.47, "learning_rate": 1.1555695239062364e-05, "loss": 1.3293, "step": 17092 }, { "epoch": 0.47, "learning_rate": 1.1554821494706615e-05, "loss": 1.3411, "step": 17093 }, { "epoch": 0.47, "learning_rate": 1.1553947738186677e-05, "loss": 1.2473, "step": 17094 }, { "epoch": 0.47, "learning_rate": 1.1553073969509382e-05, "loss": 1.3281, "step": 17095 }, { "epoch": 0.47, "learning_rate": 1.1552200188681565e-05, "loss": 1.1125, "step": 17096 }, { "epoch": 0.47, "learning_rate": 1.1551326395710066e-05, "loss": 1.3887, "step": 17097 }, { "epoch": 0.47, "learning_rate": 1.1550452590601714e-05, "loss": 1.2383, "step": 17098 }, { "epoch": 0.47, "learning_rate": 1.1549578773363355e-05, "loss": 1.1196, "step": 17099 }, { "epoch": 0.47, "learning_rate": 1.1548704944001819e-05, "loss": 1.2227, "step": 17100 }, { "epoch": 0.47, "learning_rate": 1.1547831102523943e-05, "loss": 1.1793, "step": 17101 }, { "epoch": 0.47, "learning_rate": 1.1546957248936563e-05, "loss": 1.3989, "step": 17102 }, { "epoch": 0.47, "learning_rate": 1.154608338324652e-05, "loss": 1.4087, "step": 17103 }, { "epoch": 0.47, "learning_rate": 1.1545209505460645e-05, "loss": 1.3616, "step": 17104 }, { "epoch": 0.47, "learning_rate": 1.154433561558578e-05, "loss": 1.3679, "step": 17105 }, { "epoch": 0.47, "learning_rate": 1.1543461713628759e-05, "loss": 1.3921, "step": 17106 }, { "epoch": 0.47, "learning_rate": 1.1542587799596418e-05, "loss": 1.3552, "step": 17107 }, { "epoch": 0.47, "learning_rate": 1.1541713873495595e-05, "loss": 1.2827, "step": 17108 }, { "epoch": 0.47, "learning_rate": 1.154083993533313e-05, "loss": 1.1934, "step": 17109 }, { "epoch": 0.47, "learning_rate": 1.1539965985115856e-05, "loss": 1.2739, "step": 17110 }, { "epoch": 0.47, "learning_rate": 1.1539092022850614e-05, "loss": 1.3137, "step": 17111 }, { "epoch": 0.47, "learning_rate": 1.1538218048544236e-05, "loss": 1.2322, "step": 17112 }, { "epoch": 0.47, "learning_rate": 1.1537344062203568e-05, "loss": 1.4202, "step": 17113 }, { "epoch": 0.47, "learning_rate": 1.1536470063835439e-05, "loss": 1.3445, "step": 17114 }, { "epoch": 0.47, "learning_rate": 1.1535596053446692e-05, "loss": 1.3625, "step": 17115 }, { "epoch": 0.47, "learning_rate": 1.1534722031044166e-05, "loss": 1.3452, "step": 17116 }, { "epoch": 0.47, "learning_rate": 1.1533847996634693e-05, "loss": 1.3135, "step": 17117 }, { "epoch": 0.47, "learning_rate": 1.1532973950225117e-05, "loss": 1.3965, "step": 17118 }, { "epoch": 0.47, "learning_rate": 1.1532099891822272e-05, "loss": 1.2317, "step": 17119 }, { "epoch": 0.47, "learning_rate": 1.1531225821432998e-05, "loss": 1.1497, "step": 17120 }, { "epoch": 0.47, "learning_rate": 1.1530351739064134e-05, "loss": 1.3757, "step": 17121 }, { "epoch": 0.47, "learning_rate": 1.152947764472252e-05, "loss": 1.1655, "step": 17122 }, { "epoch": 0.47, "learning_rate": 1.1528603538414989e-05, "loss": 1.2778, "step": 17123 }, { "epoch": 0.47, "learning_rate": 1.1527729420148383e-05, "loss": 1.3989, "step": 17124 }, { "epoch": 0.47, "learning_rate": 1.1526855289929539e-05, "loss": 1.1677, "step": 17125 }, { "epoch": 0.47, "learning_rate": 1.15259811477653e-05, "loss": 1.198, "step": 17126 }, { "epoch": 0.47, "learning_rate": 1.1525106993662501e-05, "loss": 1.3896, "step": 17127 }, { "epoch": 0.47, "learning_rate": 1.152423282762798e-05, "loss": 1.3293, "step": 17128 }, { "epoch": 0.47, "learning_rate": 1.1523358649668579e-05, "loss": 1.1982, "step": 17129 }, { "epoch": 0.47, "learning_rate": 1.1522484459791139e-05, "loss": 1.3003, "step": 17130 }, { "epoch": 0.47, "learning_rate": 1.1521610258002494e-05, "loss": 1.3857, "step": 17131 }, { "epoch": 0.47, "learning_rate": 1.1520736044309486e-05, "loss": 1.3662, "step": 17132 }, { "epoch": 0.47, "learning_rate": 1.1519861818718956e-05, "loss": 1.2795, "step": 17133 }, { "epoch": 0.47, "learning_rate": 1.1518987581237741e-05, "loss": 1.3552, "step": 17134 }, { "epoch": 0.47, "learning_rate": 1.151811333187268e-05, "loss": 1.4141, "step": 17135 }, { "epoch": 0.47, "learning_rate": 1.1517239070630617e-05, "loss": 1.3579, "step": 17136 }, { "epoch": 0.47, "learning_rate": 1.1516364797518386e-05, "loss": 1.3433, "step": 17137 }, { "epoch": 0.47, "learning_rate": 1.1515490512542833e-05, "loss": 1.283, "step": 17138 }, { "epoch": 0.47, "learning_rate": 1.1514616215710793e-05, "loss": 1.3296, "step": 17139 }, { "epoch": 0.47, "learning_rate": 1.1513741907029108e-05, "loss": 1.3726, "step": 17140 }, { "epoch": 0.47, "learning_rate": 1.1512867586504618e-05, "loss": 1.2102, "step": 17141 }, { "epoch": 0.47, "learning_rate": 1.1511993254144165e-05, "loss": 1.2766, "step": 17142 }, { "epoch": 0.47, "learning_rate": 1.1511118909954585e-05, "loss": 1.3328, "step": 17143 }, { "epoch": 0.47, "learning_rate": 1.1510244553942723e-05, "loss": 1.356, "step": 17144 }, { "epoch": 0.47, "learning_rate": 1.1509370186115414e-05, "loss": 1.436, "step": 17145 }, { "epoch": 0.47, "learning_rate": 1.1508495806479506e-05, "loss": 1.2886, "step": 17146 }, { "epoch": 0.47, "learning_rate": 1.1507621415041837e-05, "loss": 1.2695, "step": 17147 }, { "epoch": 0.47, "learning_rate": 1.1506747011809245e-05, "loss": 1.2009, "step": 17148 }, { "epoch": 0.47, "learning_rate": 1.1505872596788574e-05, "loss": 1.1792, "step": 17149 }, { "epoch": 0.47, "learning_rate": 1.1504998169986665e-05, "loss": 1.231, "step": 17150 }, { "epoch": 0.47, "learning_rate": 1.1504123731410355e-05, "loss": 1.293, "step": 17151 }, { "epoch": 0.47, "learning_rate": 1.150324928106649e-05, "loss": 1.3503, "step": 17152 }, { "epoch": 0.47, "learning_rate": 1.150237481896191e-05, "loss": 1.366, "step": 17153 }, { "epoch": 0.47, "learning_rate": 1.1501500345103456e-05, "loss": 1.2493, "step": 17154 }, { "epoch": 0.47, "learning_rate": 1.1500625859497968e-05, "loss": 1.2637, "step": 17155 }, { "epoch": 0.47, "learning_rate": 1.1499751362152291e-05, "loss": 1.2168, "step": 17156 }, { "epoch": 0.47, "learning_rate": 1.1498876853073261e-05, "loss": 1.2642, "step": 17157 }, { "epoch": 0.47, "learning_rate": 1.1498002332267728e-05, "loss": 1.2952, "step": 17158 }, { "epoch": 0.47, "learning_rate": 1.1497127799742524e-05, "loss": 1.3867, "step": 17159 }, { "epoch": 0.47, "learning_rate": 1.1496253255504499e-05, "loss": 1.2937, "step": 17160 }, { "epoch": 0.47, "learning_rate": 1.1495378699560491e-05, "loss": 1.3333, "step": 17161 }, { "epoch": 0.47, "learning_rate": 1.1494504131917346e-05, "loss": 1.2917, "step": 17162 }, { "epoch": 0.47, "learning_rate": 1.14936295525819e-05, "loss": 1.3291, "step": 17163 }, { "epoch": 0.47, "learning_rate": 1.1492754961561e-05, "loss": 1.2847, "step": 17164 }, { "epoch": 0.47, "learning_rate": 1.1491880358861488e-05, "loss": 1.2632, "step": 17165 }, { "epoch": 0.47, "learning_rate": 1.1491005744490206e-05, "loss": 1.3447, "step": 17166 }, { "epoch": 0.47, "learning_rate": 1.1490131118453993e-05, "loss": 1.4104, "step": 17167 }, { "epoch": 0.47, "learning_rate": 1.1489256480759699e-05, "loss": 1.2971, "step": 17168 }, { "epoch": 0.47, "learning_rate": 1.1488381831414159e-05, "loss": 1.3679, "step": 17169 }, { "epoch": 0.47, "learning_rate": 1.1487507170424224e-05, "loss": 1.3406, "step": 17170 }, { "epoch": 0.47, "learning_rate": 1.1486632497796728e-05, "loss": 1.4666, "step": 17171 }, { "epoch": 0.47, "learning_rate": 1.148575781353852e-05, "loss": 1.3008, "step": 17172 }, { "epoch": 0.47, "learning_rate": 1.148488311765644e-05, "loss": 1.2932, "step": 17173 }, { "epoch": 0.47, "learning_rate": 1.1484008410157337e-05, "loss": 1.3044, "step": 17174 }, { "epoch": 0.47, "learning_rate": 1.1483133691048044e-05, "loss": 1.2251, "step": 17175 }, { "epoch": 0.47, "learning_rate": 1.1482258960335414e-05, "loss": 1.3369, "step": 17176 }, { "epoch": 0.47, "learning_rate": 1.1481384218026289e-05, "loss": 1.1306, "step": 17177 }, { "epoch": 0.47, "learning_rate": 1.1480509464127505e-05, "loss": 1.1394, "step": 17178 }, { "epoch": 0.47, "learning_rate": 1.1479634698645916e-05, "loss": 1.2863, "step": 17179 }, { "epoch": 0.47, "learning_rate": 1.1478759921588356e-05, "loss": 1.2439, "step": 17180 }, { "epoch": 0.47, "learning_rate": 1.1477885132961679e-05, "loss": 1.2788, "step": 17181 }, { "epoch": 0.47, "learning_rate": 1.147701033277272e-05, "loss": 1.4106, "step": 17182 }, { "epoch": 0.47, "learning_rate": 1.1476135521028329e-05, "loss": 1.3777, "step": 17183 }, { "epoch": 0.47, "learning_rate": 1.1475260697735346e-05, "loss": 1.1416, "step": 17184 }, { "epoch": 0.47, "learning_rate": 1.147438586290062e-05, "loss": 1.2544, "step": 17185 }, { "epoch": 0.47, "learning_rate": 1.147351101653099e-05, "loss": 1.3418, "step": 17186 }, { "epoch": 0.47, "learning_rate": 1.1472636158633304e-05, "loss": 1.2383, "step": 17187 }, { "epoch": 0.47, "learning_rate": 1.1471761289214403e-05, "loss": 1.4185, "step": 17188 }, { "epoch": 0.47, "learning_rate": 1.1470886408281135e-05, "loss": 1.2966, "step": 17189 }, { "epoch": 0.47, "learning_rate": 1.1470011515840343e-05, "loss": 1.4487, "step": 17190 }, { "epoch": 0.47, "learning_rate": 1.146913661189887e-05, "loss": 1.2983, "step": 17191 }, { "epoch": 0.47, "learning_rate": 1.1468261696463566e-05, "loss": 1.3003, "step": 17192 }, { "epoch": 0.47, "learning_rate": 1.146738676954127e-05, "loss": 1.1731, "step": 17193 }, { "epoch": 0.47, "learning_rate": 1.1466511831138834e-05, "loss": 1.3779, "step": 17194 }, { "epoch": 0.47, "learning_rate": 1.1465636881263098e-05, "loss": 1.3003, "step": 17195 }, { "epoch": 0.47, "learning_rate": 1.1464761919920906e-05, "loss": 1.2959, "step": 17196 }, { "epoch": 0.47, "learning_rate": 1.1463886947119108e-05, "loss": 1.384, "step": 17197 }, { "epoch": 0.47, "learning_rate": 1.1463011962864546e-05, "loss": 1.303, "step": 17198 }, { "epoch": 0.47, "learning_rate": 1.1462136967164066e-05, "loss": 1.3069, "step": 17199 }, { "epoch": 0.47, "learning_rate": 1.1461261960024513e-05, "loss": 1.3152, "step": 17200 }, { "epoch": 0.47, "learning_rate": 1.1460386941452736e-05, "loss": 1.1421, "step": 17201 }, { "epoch": 0.47, "learning_rate": 1.1459511911455576e-05, "loss": 1.3574, "step": 17202 }, { "epoch": 0.47, "learning_rate": 1.1458636870039883e-05, "loss": 1.3647, "step": 17203 }, { "epoch": 0.47, "learning_rate": 1.1457761817212499e-05, "loss": 1.4897, "step": 17204 }, { "epoch": 0.47, "learning_rate": 1.1456886752980274e-05, "loss": 1.2449, "step": 17205 }, { "epoch": 0.47, "learning_rate": 1.1456011677350052e-05, "loss": 1.3982, "step": 17206 }, { "epoch": 0.47, "learning_rate": 1.1455136590328677e-05, "loss": 1.3625, "step": 17207 }, { "epoch": 0.47, "learning_rate": 1.1454261491922998e-05, "loss": 1.1709, "step": 17208 }, { "epoch": 0.47, "learning_rate": 1.1453386382139862e-05, "loss": 1.3982, "step": 17209 }, { "epoch": 0.47, "learning_rate": 1.1452511260986114e-05, "loss": 1.2295, "step": 17210 }, { "epoch": 0.47, "learning_rate": 1.1451636128468602e-05, "loss": 1.749, "step": 17211 }, { "epoch": 0.47, "learning_rate": 1.1450760984594172e-05, "loss": 1.3481, "step": 17212 }, { "epoch": 0.47, "learning_rate": 1.1449885829369668e-05, "loss": 1.2334, "step": 17213 }, { "epoch": 0.47, "learning_rate": 1.144901066280194e-05, "loss": 1.3564, "step": 17214 }, { "epoch": 0.47, "learning_rate": 1.1448135484897835e-05, "loss": 1.4487, "step": 17215 }, { "epoch": 0.47, "learning_rate": 1.1447260295664198e-05, "loss": 1.4424, "step": 17216 }, { "epoch": 0.47, "learning_rate": 1.1446385095107876e-05, "loss": 1.3677, "step": 17217 }, { "epoch": 0.47, "learning_rate": 1.1445509883235719e-05, "loss": 1.283, "step": 17218 }, { "epoch": 0.47, "learning_rate": 1.1444634660054571e-05, "loss": 1.2131, "step": 17219 }, { "epoch": 0.47, "learning_rate": 1.144375942557128e-05, "loss": 1.375, "step": 17220 }, { "epoch": 0.47, "learning_rate": 1.1442884179792699e-05, "loss": 1.3677, "step": 17221 }, { "epoch": 0.47, "learning_rate": 1.1442008922725665e-05, "loss": 1.2888, "step": 17222 }, { "epoch": 0.47, "learning_rate": 1.1441133654377033e-05, "loss": 1.1809, "step": 17223 }, { "epoch": 0.47, "learning_rate": 1.144025837475365e-05, "loss": 1.3074, "step": 17224 }, { "epoch": 0.47, "learning_rate": 1.1439383083862362e-05, "loss": 1.2871, "step": 17225 }, { "epoch": 0.47, "learning_rate": 1.1438507781710017e-05, "loss": 1.1902, "step": 17226 }, { "epoch": 0.47, "learning_rate": 1.1437632468303466e-05, "loss": 1.0764, "step": 17227 }, { "epoch": 0.47, "learning_rate": 1.1436757143649554e-05, "loss": 1.1034, "step": 17228 }, { "epoch": 0.47, "learning_rate": 1.1435881807755126e-05, "loss": 1.2344, "step": 17229 }, { "epoch": 0.47, "learning_rate": 1.1435006460627038e-05, "loss": 1.1572, "step": 17230 }, { "epoch": 0.47, "learning_rate": 1.1434131102272133e-05, "loss": 1.3232, "step": 17231 }, { "epoch": 0.47, "learning_rate": 1.143325573269726e-05, "loss": 1.4551, "step": 17232 }, { "epoch": 0.47, "learning_rate": 1.1432380351909268e-05, "loss": 1.0864, "step": 17233 }, { "epoch": 0.47, "learning_rate": 1.1431504959915007e-05, "loss": 1.3206, "step": 17234 }, { "epoch": 0.47, "learning_rate": 1.1430629556721322e-05, "loss": 1.2881, "step": 17235 }, { "epoch": 0.47, "learning_rate": 1.1429754142335069e-05, "loss": 1.3806, "step": 17236 }, { "epoch": 0.47, "learning_rate": 1.1428878716763086e-05, "loss": 1.1819, "step": 17237 }, { "epoch": 0.47, "learning_rate": 1.142800328001223e-05, "loss": 1.1973, "step": 17238 }, { "epoch": 0.47, "learning_rate": 1.1427127832089346e-05, "loss": 1.3032, "step": 17239 }, { "epoch": 0.47, "learning_rate": 1.142625237300129e-05, "loss": 1.3987, "step": 17240 }, { "epoch": 0.47, "learning_rate": 1.1425376902754901e-05, "loss": 1.2617, "step": 17241 }, { "epoch": 0.47, "learning_rate": 1.1424501421357038e-05, "loss": 1.1088, "step": 17242 }, { "epoch": 0.47, "learning_rate": 1.1423625928814541e-05, "loss": 1.4658, "step": 17243 }, { "epoch": 0.47, "learning_rate": 1.1422750425134268e-05, "loss": 1.2485, "step": 17244 }, { "epoch": 0.47, "learning_rate": 1.1421874910323063e-05, "loss": 1.1843, "step": 17245 }, { "epoch": 0.47, "learning_rate": 1.1420999384387778e-05, "loss": 1.2495, "step": 17246 }, { "epoch": 0.47, "learning_rate": 1.142012384733526e-05, "loss": 1.3208, "step": 17247 }, { "epoch": 0.47, "learning_rate": 1.1419248299172363e-05, "loss": 1.3169, "step": 17248 }, { "epoch": 0.47, "learning_rate": 1.1418372739905935e-05, "loss": 1.4014, "step": 17249 }, { "epoch": 0.47, "learning_rate": 1.1417497169542823e-05, "loss": 1.2991, "step": 17250 }, { "epoch": 0.47, "learning_rate": 1.1416621588089882e-05, "loss": 1.2429, "step": 17251 }, { "epoch": 0.47, "learning_rate": 1.141574599555396e-05, "loss": 1.2207, "step": 17252 }, { "epoch": 0.47, "learning_rate": 1.1414870391941904e-05, "loss": 1.1121, "step": 17253 }, { "epoch": 0.47, "learning_rate": 1.1413994777260568e-05, "loss": 1.2607, "step": 17254 }, { "epoch": 0.47, "learning_rate": 1.1413119151516804e-05, "loss": 1.2427, "step": 17255 }, { "epoch": 0.47, "learning_rate": 1.141224351471746e-05, "loss": 1.3323, "step": 17256 }, { "epoch": 0.47, "learning_rate": 1.1411367866869387e-05, "loss": 1.249, "step": 17257 }, { "epoch": 0.47, "learning_rate": 1.1410492207979435e-05, "loss": 1.4104, "step": 17258 }, { "epoch": 0.47, "learning_rate": 1.1409616538054456e-05, "loss": 1.2214, "step": 17259 }, { "epoch": 0.47, "learning_rate": 1.1408740857101298e-05, "loss": 1.3137, "step": 17260 }, { "epoch": 0.47, "learning_rate": 1.1407865165126815e-05, "loss": 1.2207, "step": 17261 }, { "epoch": 0.47, "learning_rate": 1.1406989462137858e-05, "loss": 1.0972, "step": 17262 }, { "epoch": 0.47, "learning_rate": 1.1406113748141276e-05, "loss": 1.3672, "step": 17263 }, { "epoch": 0.47, "learning_rate": 1.1405238023143923e-05, "loss": 1.1079, "step": 17264 }, { "epoch": 0.47, "learning_rate": 1.1404362287152646e-05, "loss": 1.241, "step": 17265 }, { "epoch": 0.47, "learning_rate": 1.14034865401743e-05, "loss": 1.1995, "step": 17266 }, { "epoch": 0.47, "learning_rate": 1.1402610782215735e-05, "loss": 1.3645, "step": 17267 }, { "epoch": 0.47, "learning_rate": 1.1401735013283803e-05, "loss": 1.3809, "step": 17268 }, { "epoch": 0.47, "learning_rate": 1.1400859233385355e-05, "loss": 1.2959, "step": 17269 }, { "epoch": 0.47, "learning_rate": 1.1399983442527243e-05, "loss": 1.4058, "step": 17270 }, { "epoch": 0.47, "learning_rate": 1.1399107640716318e-05, "loss": 1.5303, "step": 17271 }, { "epoch": 0.47, "learning_rate": 1.1398231827959434e-05, "loss": 1.3269, "step": 17272 }, { "epoch": 0.47, "learning_rate": 1.1397356004263442e-05, "loss": 1.1394, "step": 17273 }, { "epoch": 0.47, "learning_rate": 1.1396480169635194e-05, "loss": 1.3257, "step": 17274 }, { "epoch": 0.47, "learning_rate": 1.139560432408154e-05, "loss": 1.4131, "step": 17275 }, { "epoch": 0.47, "learning_rate": 1.1394728467609336e-05, "loss": 1.2676, "step": 17276 }, { "epoch": 0.47, "learning_rate": 1.139385260022543e-05, "loss": 1.355, "step": 17277 }, { "epoch": 0.47, "learning_rate": 1.139297672193668e-05, "loss": 1.4102, "step": 17278 }, { "epoch": 0.47, "learning_rate": 1.1392100832749933e-05, "loss": 1.3018, "step": 17279 }, { "epoch": 0.47, "learning_rate": 1.1391224932672045e-05, "loss": 1.3447, "step": 17280 }, { "epoch": 0.47, "learning_rate": 1.1390349021709865e-05, "loss": 1.3164, "step": 17281 }, { "epoch": 0.47, "learning_rate": 1.138947309987025e-05, "loss": 1.3267, "step": 17282 }, { "epoch": 0.47, "learning_rate": 1.138859716716005e-05, "loss": 1.1353, "step": 17283 }, { "epoch": 0.47, "learning_rate": 1.1387721223586117e-05, "loss": 1.0273, "step": 17284 }, { "epoch": 0.47, "learning_rate": 1.138684526915531e-05, "loss": 1.3601, "step": 17285 }, { "epoch": 0.47, "learning_rate": 1.1385969303874473e-05, "loss": 1.3457, "step": 17286 }, { "epoch": 0.47, "learning_rate": 1.1385093327750467e-05, "loss": 1.281, "step": 17287 }, { "epoch": 0.47, "learning_rate": 1.1384217340790142e-05, "loss": 1.1516, "step": 17288 }, { "epoch": 0.47, "learning_rate": 1.1383341343000351e-05, "loss": 1.592, "step": 17289 }, { "epoch": 0.47, "learning_rate": 1.1382465334387946e-05, "loss": 1.1665, "step": 17290 }, { "epoch": 0.47, "learning_rate": 1.1381589314959787e-05, "loss": 1.6895, "step": 17291 }, { "epoch": 0.47, "learning_rate": 1.1380713284722717e-05, "loss": 1.3389, "step": 17292 }, { "epoch": 0.47, "learning_rate": 1.13798372436836e-05, "loss": 1.3662, "step": 17293 }, { "epoch": 0.47, "learning_rate": 1.1378961191849282e-05, "loss": 1.2695, "step": 17294 }, { "epoch": 0.47, "learning_rate": 1.1378085129226624e-05, "loss": 1.2876, "step": 17295 }, { "epoch": 0.47, "learning_rate": 1.1377209055822473e-05, "loss": 1.386, "step": 17296 }, { "epoch": 0.47, "learning_rate": 1.1376332971643688e-05, "loss": 1.1758, "step": 17297 }, { "epoch": 0.47, "learning_rate": 1.1375456876697118e-05, "loss": 1.2158, "step": 17298 }, { "epoch": 0.47, "learning_rate": 1.1374580770989622e-05, "loss": 1.2605, "step": 17299 }, { "epoch": 0.47, "learning_rate": 1.137370465452805e-05, "loss": 1.3579, "step": 17300 }, { "epoch": 0.47, "learning_rate": 1.1372828527319262e-05, "loss": 1.2803, "step": 17301 }, { "epoch": 0.47, "learning_rate": 1.1371952389370107e-05, "loss": 1.2786, "step": 17302 }, { "epoch": 0.47, "learning_rate": 1.1371076240687444e-05, "loss": 1.1423, "step": 17303 }, { "epoch": 0.47, "learning_rate": 1.1370200081278124e-05, "loss": 1.2578, "step": 17304 }, { "epoch": 0.47, "learning_rate": 1.1369323911149004e-05, "loss": 1.2366, "step": 17305 }, { "epoch": 0.47, "learning_rate": 1.1368447730306935e-05, "loss": 1.1233, "step": 17306 }, { "epoch": 0.47, "learning_rate": 1.1367571538758777e-05, "loss": 1.3638, "step": 17307 }, { "epoch": 0.47, "learning_rate": 1.136669533651138e-05, "loss": 1.1693, "step": 17308 }, { "epoch": 0.47, "learning_rate": 1.1365819123571605e-05, "loss": 1.2896, "step": 17309 }, { "epoch": 0.47, "learning_rate": 1.1364942899946301e-05, "loss": 1.3088, "step": 17310 }, { "epoch": 0.47, "learning_rate": 1.1364066665642326e-05, "loss": 1.2849, "step": 17311 }, { "epoch": 0.47, "learning_rate": 1.1363190420666532e-05, "loss": 1.2286, "step": 17312 }, { "epoch": 0.47, "learning_rate": 1.1362314165025782e-05, "loss": 1.094, "step": 17313 }, { "epoch": 0.47, "learning_rate": 1.1361437898726923e-05, "loss": 1.2617, "step": 17314 }, { "epoch": 0.47, "learning_rate": 1.1360561621776816e-05, "loss": 1.3533, "step": 17315 }, { "epoch": 0.47, "learning_rate": 1.135968533418231e-05, "loss": 1.2305, "step": 17316 }, { "epoch": 0.47, "learning_rate": 1.135880903595027e-05, "loss": 1.3232, "step": 17317 }, { "epoch": 0.47, "learning_rate": 1.1357932727087548e-05, "loss": 1.334, "step": 17318 }, { "epoch": 0.47, "learning_rate": 1.1357056407600997e-05, "loss": 1.2869, "step": 17319 }, { "epoch": 0.47, "learning_rate": 1.1356180077497474e-05, "loss": 1.2554, "step": 17320 }, { "epoch": 0.47, "learning_rate": 1.1355303736783838e-05, "loss": 1.438, "step": 17321 }, { "epoch": 0.47, "learning_rate": 1.1354427385466942e-05, "loss": 1.2682, "step": 17322 }, { "epoch": 0.47, "learning_rate": 1.1353551023553644e-05, "loss": 1.7085, "step": 17323 }, { "epoch": 0.47, "learning_rate": 1.1352674651050797e-05, "loss": 1.3347, "step": 17324 }, { "epoch": 0.47, "learning_rate": 1.1351798267965261e-05, "loss": 1.3787, "step": 17325 }, { "epoch": 0.47, "learning_rate": 1.135092187430389e-05, "loss": 1.2151, "step": 17326 }, { "epoch": 0.47, "learning_rate": 1.1350045470073543e-05, "loss": 1.1899, "step": 17327 }, { "epoch": 0.47, "learning_rate": 1.1349169055281073e-05, "loss": 1.3467, "step": 17328 }, { "epoch": 0.47, "learning_rate": 1.1348292629933342e-05, "loss": 1.4333, "step": 17329 }, { "epoch": 0.47, "learning_rate": 1.13474161940372e-05, "loss": 1.2739, "step": 17330 }, { "epoch": 0.47, "learning_rate": 1.1346539747599508e-05, "loss": 1.4668, "step": 17331 }, { "epoch": 0.47, "learning_rate": 1.1345663290627126e-05, "loss": 1.3577, "step": 17332 }, { "epoch": 0.47, "learning_rate": 1.1344786823126901e-05, "loss": 1.4265, "step": 17333 }, { "epoch": 0.47, "learning_rate": 1.13439103451057e-05, "loss": 1.3418, "step": 17334 }, { "epoch": 0.47, "learning_rate": 1.1343033856570376e-05, "loss": 1.1755, "step": 17335 }, { "epoch": 0.47, "learning_rate": 1.1342157357527788e-05, "loss": 1.2888, "step": 17336 }, { "epoch": 0.47, "learning_rate": 1.1341280847984788e-05, "loss": 1.2261, "step": 17337 }, { "epoch": 0.47, "learning_rate": 1.1340404327948242e-05, "loss": 1.1783, "step": 17338 }, { "epoch": 0.47, "learning_rate": 1.1339527797424998e-05, "loss": 1.3469, "step": 17339 }, { "epoch": 0.47, "learning_rate": 1.1338651256421925e-05, "loss": 1.2969, "step": 17340 }, { "epoch": 0.47, "learning_rate": 1.1337774704945868e-05, "loss": 1.3772, "step": 17341 }, { "epoch": 0.47, "learning_rate": 1.1336898143003694e-05, "loss": 1.332, "step": 17342 }, { "epoch": 0.47, "learning_rate": 1.1336021570602253e-05, "loss": 1.4084, "step": 17343 }, { "epoch": 0.47, "learning_rate": 1.1335144987748415e-05, "loss": 1.3083, "step": 17344 }, { "epoch": 0.47, "learning_rate": 1.1334268394449024e-05, "loss": 1.3586, "step": 17345 }, { "epoch": 0.47, "learning_rate": 1.1333391790710946e-05, "loss": 1.4062, "step": 17346 }, { "epoch": 0.47, "learning_rate": 1.1332515176541038e-05, "loss": 1.2266, "step": 17347 }, { "epoch": 0.47, "learning_rate": 1.1331638551946158e-05, "loss": 1.2847, "step": 17348 }, { "epoch": 0.47, "learning_rate": 1.1330761916933164e-05, "loss": 1.3652, "step": 17349 }, { "epoch": 0.47, "learning_rate": 1.1329885271508915e-05, "loss": 1.3525, "step": 17350 }, { "epoch": 0.47, "learning_rate": 1.132900861568027e-05, "loss": 1.332, "step": 17351 }, { "epoch": 0.47, "learning_rate": 1.1328131949454086e-05, "loss": 1.3003, "step": 17352 }, { "epoch": 0.47, "learning_rate": 1.1327255272837221e-05, "loss": 1.3022, "step": 17353 }, { "epoch": 0.47, "learning_rate": 1.1326378585836537e-05, "loss": 1.3794, "step": 17354 }, { "epoch": 0.47, "learning_rate": 1.1325501888458887e-05, "loss": 1.2917, "step": 17355 }, { "epoch": 0.47, "learning_rate": 1.1324625180711137e-05, "loss": 1.4409, "step": 17356 }, { "epoch": 0.47, "learning_rate": 1.1323748462600142e-05, "loss": 1.3877, "step": 17357 }, { "epoch": 0.47, "learning_rate": 1.1322871734132761e-05, "loss": 1.3467, "step": 17358 }, { "epoch": 0.47, "learning_rate": 1.1321994995315853e-05, "loss": 1.3174, "step": 17359 }, { "epoch": 0.47, "learning_rate": 1.1321118246156277e-05, "loss": 1.2646, "step": 17360 }, { "epoch": 0.47, "learning_rate": 1.1320241486660895e-05, "loss": 1.189, "step": 17361 }, { "epoch": 0.47, "learning_rate": 1.1319364716836564e-05, "loss": 1.2896, "step": 17362 }, { "epoch": 0.47, "learning_rate": 1.131848793669014e-05, "loss": 1.397, "step": 17363 }, { "epoch": 0.47, "learning_rate": 1.1317611146228492e-05, "loss": 1.4282, "step": 17364 }, { "epoch": 0.47, "learning_rate": 1.1316734345458472e-05, "loss": 1.2263, "step": 17365 }, { "epoch": 0.47, "learning_rate": 1.131585753438694e-05, "loss": 1.1743, "step": 17366 }, { "epoch": 0.47, "learning_rate": 1.1314980713020757e-05, "loss": 1.6985, "step": 17367 }, { "epoch": 0.47, "learning_rate": 1.1314103881366786e-05, "loss": 1.2556, "step": 17368 }, { "epoch": 0.47, "learning_rate": 1.1313227039431885e-05, "loss": 1.6057, "step": 17369 }, { "epoch": 0.47, "learning_rate": 1.1312350187222911e-05, "loss": 1.2925, "step": 17370 }, { "epoch": 0.47, "learning_rate": 1.1311473324746728e-05, "loss": 1.3533, "step": 17371 }, { "epoch": 0.47, "learning_rate": 1.1310596452010195e-05, "loss": 1.157, "step": 17372 }, { "epoch": 0.47, "learning_rate": 1.1309719569020166e-05, "loss": 1.2891, "step": 17373 }, { "epoch": 0.47, "learning_rate": 1.1308842675783513e-05, "loss": 1.2778, "step": 17374 }, { "epoch": 0.47, "learning_rate": 1.1307965772307086e-05, "loss": 1.1794, "step": 17375 }, { "epoch": 0.47, "learning_rate": 1.1307088858597755e-05, "loss": 1.2861, "step": 17376 }, { "epoch": 0.47, "learning_rate": 1.130621193466237e-05, "loss": 1.2517, "step": 17377 }, { "epoch": 0.47, "learning_rate": 1.1305335000507797e-05, "loss": 1.3979, "step": 17378 }, { "epoch": 0.47, "learning_rate": 1.1304458056140902e-05, "loss": 1.2502, "step": 17379 }, { "epoch": 0.47, "learning_rate": 1.1303581101568537e-05, "loss": 1.2542, "step": 17380 }, { "epoch": 0.47, "learning_rate": 1.1302704136797568e-05, "loss": 1.2054, "step": 17381 }, { "epoch": 0.47, "learning_rate": 1.1301827161834853e-05, "loss": 1.3101, "step": 17382 }, { "epoch": 0.47, "learning_rate": 1.1300950176687255e-05, "loss": 1.3669, "step": 17383 }, { "epoch": 0.47, "learning_rate": 1.1300073181361634e-05, "loss": 1.1272, "step": 17384 }, { "epoch": 0.47, "learning_rate": 1.1299196175864852e-05, "loss": 1.2856, "step": 17385 }, { "epoch": 0.47, "learning_rate": 1.1298319160203771e-05, "loss": 1.2935, "step": 17386 }, { "epoch": 0.47, "learning_rate": 1.1297442134385253e-05, "loss": 1.3623, "step": 17387 }, { "epoch": 0.47, "learning_rate": 1.1296565098416154e-05, "loss": 1.3345, "step": 17388 }, { "epoch": 0.47, "learning_rate": 1.1295688052303342e-05, "loss": 1.2942, "step": 17389 }, { "epoch": 0.47, "learning_rate": 1.1294810996053673e-05, "loss": 1.2292, "step": 17390 }, { "epoch": 0.47, "learning_rate": 1.1293933929674012e-05, "loss": 1.4768, "step": 17391 }, { "epoch": 0.47, "learning_rate": 1.1293056853171226e-05, "loss": 1.3645, "step": 17392 }, { "epoch": 0.47, "learning_rate": 1.1292179766552165e-05, "loss": 1.3765, "step": 17393 }, { "epoch": 0.48, "learning_rate": 1.1291302669823699e-05, "loss": 1.3538, "step": 17394 }, { "epoch": 0.48, "learning_rate": 1.129042556299269e-05, "loss": 1.3334, "step": 17395 }, { "epoch": 0.48, "learning_rate": 1.1289548446065994e-05, "loss": 1.2549, "step": 17396 }, { "epoch": 0.48, "learning_rate": 1.1288671319050482e-05, "loss": 1.4048, "step": 17397 }, { "epoch": 0.48, "learning_rate": 1.1287794181953008e-05, "loss": 1.3765, "step": 17398 }, { "epoch": 0.48, "learning_rate": 1.128691703478044e-05, "loss": 1.251, "step": 17399 }, { "epoch": 0.48, "learning_rate": 1.1286039877539638e-05, "loss": 1.2579, "step": 17400 }, { "epoch": 0.48, "learning_rate": 1.1285162710237464e-05, "loss": 1.2136, "step": 17401 }, { "epoch": 0.48, "learning_rate": 1.128428553288078e-05, "loss": 1.7144, "step": 17402 }, { "epoch": 0.48, "learning_rate": 1.1283408345476455e-05, "loss": 1.478, "step": 17403 }, { "epoch": 0.48, "learning_rate": 1.1282531148031341e-05, "loss": 1.1987, "step": 17404 }, { "epoch": 0.48, "learning_rate": 1.128165394055231e-05, "loss": 1.6118, "step": 17405 }, { "epoch": 0.48, "learning_rate": 1.1280776723046221e-05, "loss": 1.4087, "step": 17406 }, { "epoch": 0.48, "learning_rate": 1.1279899495519937e-05, "loss": 1.2549, "step": 17407 }, { "epoch": 0.48, "learning_rate": 1.1279022257980317e-05, "loss": 1.301, "step": 17408 }, { "epoch": 0.48, "learning_rate": 1.1278145010434232e-05, "loss": 1.4702, "step": 17409 }, { "epoch": 0.48, "learning_rate": 1.1277267752888541e-05, "loss": 1.3901, "step": 17410 }, { "epoch": 0.48, "learning_rate": 1.1276390485350108e-05, "loss": 1.2593, "step": 17411 }, { "epoch": 0.48, "learning_rate": 1.1275513207825794e-05, "loss": 1.2634, "step": 17412 }, { "epoch": 0.48, "learning_rate": 1.1274635920322467e-05, "loss": 1.2664, "step": 17413 }, { "epoch": 0.48, "learning_rate": 1.1273758622846986e-05, "loss": 1.4062, "step": 17414 }, { "epoch": 0.48, "learning_rate": 1.1272881315406221e-05, "loss": 1.188, "step": 17415 }, { "epoch": 0.48, "learning_rate": 1.1272003998007025e-05, "loss": 1.3308, "step": 17416 }, { "epoch": 0.48, "learning_rate": 1.1271126670656272e-05, "loss": 1.1941, "step": 17417 }, { "epoch": 0.48, "learning_rate": 1.1270249333360821e-05, "loss": 1.3503, "step": 17418 }, { "epoch": 0.48, "learning_rate": 1.1269371986127538e-05, "loss": 1.3823, "step": 17419 }, { "epoch": 0.48, "learning_rate": 1.126849462896328e-05, "loss": 1.4417, "step": 17420 }, { "epoch": 0.48, "learning_rate": 1.1267617261874922e-05, "loss": 1.3528, "step": 17421 }, { "epoch": 0.48, "learning_rate": 1.126673988486932e-05, "loss": 1.3394, "step": 17422 }, { "epoch": 0.48, "learning_rate": 1.1265862497953342e-05, "loss": 1.2834, "step": 17423 }, { "epoch": 0.48, "learning_rate": 1.1264985101133847e-05, "loss": 1.2007, "step": 17424 }, { "epoch": 0.48, "learning_rate": 1.1264107694417707e-05, "loss": 1.2686, "step": 17425 }, { "epoch": 0.48, "learning_rate": 1.1263230277811783e-05, "loss": 1.3042, "step": 17426 }, { "epoch": 0.48, "learning_rate": 1.126235285132294e-05, "loss": 1.3315, "step": 17427 }, { "epoch": 0.48, "learning_rate": 1.1261475414958038e-05, "loss": 1.1477, "step": 17428 }, { "epoch": 0.48, "learning_rate": 1.126059796872395e-05, "loss": 1.2583, "step": 17429 }, { "epoch": 0.48, "learning_rate": 1.1259720512627534e-05, "loss": 1.6289, "step": 17430 }, { "epoch": 0.48, "learning_rate": 1.1258843046675658e-05, "loss": 1.3289, "step": 17431 }, { "epoch": 0.48, "learning_rate": 1.1257965570875184e-05, "loss": 1.1682, "step": 17432 }, { "epoch": 0.48, "learning_rate": 1.1257088085232983e-05, "loss": 1.229, "step": 17433 }, { "epoch": 0.48, "learning_rate": 1.1256210589755913e-05, "loss": 1.3665, "step": 17434 }, { "epoch": 0.48, "learning_rate": 1.1255333084450844e-05, "loss": 1.3291, "step": 17435 }, { "epoch": 0.48, "learning_rate": 1.1254455569324636e-05, "loss": 1.3582, "step": 17436 }, { "epoch": 0.48, "learning_rate": 1.1253578044384162e-05, "loss": 1.302, "step": 17437 }, { "epoch": 0.48, "learning_rate": 1.1252700509636278e-05, "loss": 1.3325, "step": 17438 }, { "epoch": 0.48, "learning_rate": 1.1251822965087856e-05, "loss": 1.2798, "step": 17439 }, { "epoch": 0.48, "learning_rate": 1.1250945410745759e-05, "loss": 1.1106, "step": 17440 }, { "epoch": 0.48, "learning_rate": 1.1250067846616855e-05, "loss": 1.2227, "step": 17441 }, { "epoch": 0.48, "learning_rate": 1.1249190272708009e-05, "loss": 1.2344, "step": 17442 }, { "epoch": 0.48, "learning_rate": 1.1248312689026081e-05, "loss": 1.3533, "step": 17443 }, { "epoch": 0.48, "learning_rate": 1.1247435095577948e-05, "loss": 1.2449, "step": 17444 }, { "epoch": 0.48, "learning_rate": 1.1246557492370465e-05, "loss": 1.1936, "step": 17445 }, { "epoch": 0.48, "learning_rate": 1.1245679879410504e-05, "loss": 1.3743, "step": 17446 }, { "epoch": 0.48, "learning_rate": 1.1244802256704927e-05, "loss": 1.3186, "step": 17447 }, { "epoch": 0.48, "learning_rate": 1.1243924624260607e-05, "loss": 1.2444, "step": 17448 }, { "epoch": 0.48, "learning_rate": 1.1243046982084402e-05, "loss": 1.2686, "step": 17449 }, { "epoch": 0.48, "learning_rate": 1.1242169330183183e-05, "loss": 1.1787, "step": 17450 }, { "epoch": 0.48, "learning_rate": 1.1241291668563816e-05, "loss": 1.4829, "step": 17451 }, { "epoch": 0.48, "learning_rate": 1.1240413997233167e-05, "loss": 1.2898, "step": 17452 }, { "epoch": 0.48, "learning_rate": 1.1239536316198099e-05, "loss": 1.3721, "step": 17453 }, { "epoch": 0.48, "learning_rate": 1.1238658625465486e-05, "loss": 1.2993, "step": 17454 }, { "epoch": 0.48, "learning_rate": 1.1237780925042186e-05, "loss": 1.2539, "step": 17455 }, { "epoch": 0.48, "learning_rate": 1.1236903214935073e-05, "loss": 1.6646, "step": 17456 }, { "epoch": 0.48, "learning_rate": 1.1236025495151008e-05, "loss": 1.3147, "step": 17457 }, { "epoch": 0.48, "learning_rate": 1.1235147765696865e-05, "loss": 1.3589, "step": 17458 }, { "epoch": 0.48, "learning_rate": 1.1234270026579504e-05, "loss": 1.3079, "step": 17459 }, { "epoch": 0.48, "learning_rate": 1.1233392277805795e-05, "loss": 1.3044, "step": 17460 }, { "epoch": 0.48, "learning_rate": 1.1232514519382605e-05, "loss": 1.5088, "step": 17461 }, { "epoch": 0.48, "learning_rate": 1.12316367513168e-05, "loss": 1.2422, "step": 17462 }, { "epoch": 0.48, "learning_rate": 1.123075897361525e-05, "loss": 1.3152, "step": 17463 }, { "epoch": 0.48, "learning_rate": 1.122988118628482e-05, "loss": 1.3086, "step": 17464 }, { "epoch": 0.48, "learning_rate": 1.1229003389332377e-05, "loss": 1.2754, "step": 17465 }, { "epoch": 0.48, "learning_rate": 1.1228125582764794e-05, "loss": 1.3389, "step": 17466 }, { "epoch": 0.48, "learning_rate": 1.1227247766588927e-05, "loss": 1.4277, "step": 17467 }, { "epoch": 0.48, "learning_rate": 1.1226369940811655e-05, "loss": 1.22, "step": 17468 }, { "epoch": 0.48, "learning_rate": 1.122549210543984e-05, "loss": 1.1284, "step": 17469 }, { "epoch": 0.48, "learning_rate": 1.1224614260480349e-05, "loss": 1.165, "step": 17470 }, { "epoch": 0.48, "learning_rate": 1.1223736405940053e-05, "loss": 1.1477, "step": 17471 }, { "epoch": 0.48, "learning_rate": 1.122285854182582e-05, "loss": 1.3567, "step": 17472 }, { "epoch": 0.48, "learning_rate": 1.1221980668144516e-05, "loss": 1.187, "step": 17473 }, { "epoch": 0.48, "learning_rate": 1.122110278490301e-05, "loss": 1.2927, "step": 17474 }, { "epoch": 0.48, "learning_rate": 1.1220224892108172e-05, "loss": 1.356, "step": 17475 }, { "epoch": 0.48, "learning_rate": 1.1219346989766866e-05, "loss": 1.1953, "step": 17476 }, { "epoch": 0.48, "learning_rate": 1.1218469077885963e-05, "loss": 1.4348, "step": 17477 }, { "epoch": 0.48, "learning_rate": 1.1217591156472331e-05, "loss": 1.3643, "step": 17478 }, { "epoch": 0.48, "learning_rate": 1.1216713225532838e-05, "loss": 1.2952, "step": 17479 }, { "epoch": 0.48, "learning_rate": 1.1215835285074355e-05, "loss": 1.2446, "step": 17480 }, { "epoch": 0.48, "learning_rate": 1.1214957335103745e-05, "loss": 1.2427, "step": 17481 }, { "epoch": 0.48, "learning_rate": 1.1214079375627885e-05, "loss": 1.2317, "step": 17482 }, { "epoch": 0.48, "learning_rate": 1.1213201406653634e-05, "loss": 1.3242, "step": 17483 }, { "epoch": 0.48, "learning_rate": 1.1212323428187868e-05, "loss": 1.2151, "step": 17484 }, { "epoch": 0.48, "learning_rate": 1.1211445440237452e-05, "loss": 1.282, "step": 17485 }, { "epoch": 0.48, "learning_rate": 1.1210567442809255e-05, "loss": 1.7485, "step": 17486 }, { "epoch": 0.48, "learning_rate": 1.1209689435910152e-05, "loss": 1.2898, "step": 17487 }, { "epoch": 0.48, "learning_rate": 1.1208811419547005e-05, "loss": 1.1591, "step": 17488 }, { "epoch": 0.48, "learning_rate": 1.1207933393726686e-05, "loss": 1.3857, "step": 17489 }, { "epoch": 0.48, "learning_rate": 1.1207055358456064e-05, "loss": 1.2412, "step": 17490 }, { "epoch": 0.48, "learning_rate": 1.120617731374201e-05, "loss": 1.3074, "step": 17491 }, { "epoch": 0.48, "learning_rate": 1.1205299259591392e-05, "loss": 1.2422, "step": 17492 }, { "epoch": 0.48, "learning_rate": 1.120442119601108e-05, "loss": 1.3652, "step": 17493 }, { "epoch": 0.48, "learning_rate": 1.120354312300794e-05, "loss": 1.2378, "step": 17494 }, { "epoch": 0.48, "learning_rate": 1.1202665040588848e-05, "loss": 1.5088, "step": 17495 }, { "epoch": 0.48, "learning_rate": 1.1201786948760667e-05, "loss": 1.1504, "step": 17496 }, { "epoch": 0.48, "learning_rate": 1.1200908847530272e-05, "loss": 1.3323, "step": 17497 }, { "epoch": 0.48, "learning_rate": 1.1200030736904529e-05, "loss": 1.3672, "step": 17498 }, { "epoch": 0.48, "learning_rate": 1.1199152616890312e-05, "loss": 1.2795, "step": 17499 }, { "epoch": 0.48, "learning_rate": 1.1198274487494485e-05, "loss": 1.1799, "step": 17500 }, { "epoch": 0.48, "learning_rate": 1.1197396348723923e-05, "loss": 1.4075, "step": 17501 }, { "epoch": 0.48, "learning_rate": 1.1196518200585497e-05, "loss": 1.1335, "step": 17502 }, { "epoch": 0.48, "learning_rate": 1.1195640043086075e-05, "loss": 1.1835, "step": 17503 }, { "epoch": 0.48, "learning_rate": 1.1194761876232528e-05, "loss": 1.3054, "step": 17504 }, { "epoch": 0.48, "learning_rate": 1.1193883700031724e-05, "loss": 1.3992, "step": 17505 }, { "epoch": 0.48, "learning_rate": 1.1193005514490538e-05, "loss": 1.3276, "step": 17506 }, { "epoch": 0.48, "learning_rate": 1.1192127319615837e-05, "loss": 1.3403, "step": 17507 }, { "epoch": 0.48, "learning_rate": 1.1191249115414491e-05, "loss": 1.3032, "step": 17508 }, { "epoch": 0.48, "learning_rate": 1.1190370901893376e-05, "loss": 1.3293, "step": 17509 }, { "epoch": 0.48, "learning_rate": 1.1189492679059353e-05, "loss": 1.2598, "step": 17510 }, { "epoch": 0.48, "learning_rate": 1.1188614446919301e-05, "loss": 1.2957, "step": 17511 }, { "epoch": 0.48, "learning_rate": 1.118773620548009e-05, "loss": 1.3477, "step": 17512 }, { "epoch": 0.48, "learning_rate": 1.118685795474859e-05, "loss": 1.1997, "step": 17513 }, { "epoch": 0.48, "learning_rate": 1.1185979694731668e-05, "loss": 1.2542, "step": 17514 }, { "epoch": 0.48, "learning_rate": 1.11851014254362e-05, "loss": 1.3777, "step": 17515 }, { "epoch": 0.48, "learning_rate": 1.1184223146869055e-05, "loss": 1.3967, "step": 17516 }, { "epoch": 0.48, "learning_rate": 1.1183344859037105e-05, "loss": 1.3381, "step": 17517 }, { "epoch": 0.48, "learning_rate": 1.1182466561947223e-05, "loss": 1.2661, "step": 17518 }, { "epoch": 0.48, "learning_rate": 1.118158825560628e-05, "loss": 1.2393, "step": 17519 }, { "epoch": 0.48, "learning_rate": 1.1180709940021142e-05, "loss": 1.1929, "step": 17520 }, { "epoch": 0.48, "learning_rate": 1.1179831615198689e-05, "loss": 1.4062, "step": 17521 }, { "epoch": 0.48, "learning_rate": 1.1178953281145784e-05, "loss": 1.436, "step": 17522 }, { "epoch": 0.48, "learning_rate": 1.1178074937869305e-05, "loss": 1.3259, "step": 17523 }, { "epoch": 0.48, "learning_rate": 1.117719658537612e-05, "loss": 1.2214, "step": 17524 }, { "epoch": 0.48, "learning_rate": 1.1176318223673106e-05, "loss": 1.2322, "step": 17525 }, { "epoch": 0.48, "learning_rate": 1.117543985276713e-05, "loss": 1.095, "step": 17526 }, { "epoch": 0.48, "learning_rate": 1.1174561472665064e-05, "loss": 1.2114, "step": 17527 }, { "epoch": 0.48, "learning_rate": 1.1173683083373781e-05, "loss": 1.3472, "step": 17528 }, { "epoch": 0.48, "learning_rate": 1.1172804684900155e-05, "loss": 1.3582, "step": 17529 }, { "epoch": 0.48, "learning_rate": 1.1171926277251055e-05, "loss": 1.4414, "step": 17530 }, { "epoch": 0.48, "learning_rate": 1.1171047860433358e-05, "loss": 1.2056, "step": 17531 }, { "epoch": 0.48, "learning_rate": 1.1170169434453931e-05, "loss": 1.2833, "step": 17532 }, { "epoch": 0.48, "learning_rate": 1.1169290999319647e-05, "loss": 1.2917, "step": 17533 }, { "epoch": 0.48, "learning_rate": 1.1168412555037383e-05, "loss": 1.3325, "step": 17534 }, { "epoch": 0.48, "learning_rate": 1.1167534101614007e-05, "loss": 1.3186, "step": 17535 }, { "epoch": 0.48, "learning_rate": 1.1166655639056394e-05, "loss": 1.3125, "step": 17536 }, { "epoch": 0.48, "learning_rate": 1.1165777167371414e-05, "loss": 1.2002, "step": 17537 }, { "epoch": 0.48, "learning_rate": 1.1164898686565944e-05, "loss": 1.1583, "step": 17538 }, { "epoch": 0.48, "learning_rate": 1.1164020196646854e-05, "loss": 1.3567, "step": 17539 }, { "epoch": 0.48, "learning_rate": 1.1163141697621016e-05, "loss": 1.3953, "step": 17540 }, { "epoch": 0.48, "learning_rate": 1.1162263189495306e-05, "loss": 1.3948, "step": 17541 }, { "epoch": 0.48, "learning_rate": 1.1161384672276593e-05, "loss": 1.1677, "step": 17542 }, { "epoch": 0.48, "learning_rate": 1.1160506145971757e-05, "loss": 1.6289, "step": 17543 }, { "epoch": 0.48, "learning_rate": 1.1159627610587662e-05, "loss": 1.2471, "step": 17544 }, { "epoch": 0.48, "learning_rate": 1.1158749066131189e-05, "loss": 1.2554, "step": 17545 }, { "epoch": 0.48, "learning_rate": 1.1157870512609207e-05, "loss": 1.3535, "step": 17546 }, { "epoch": 0.48, "learning_rate": 1.115699195002859e-05, "loss": 1.1846, "step": 17547 }, { "epoch": 0.48, "learning_rate": 1.1156113378396211e-05, "loss": 1.2388, "step": 17548 }, { "epoch": 0.48, "learning_rate": 1.1155234797718946e-05, "loss": 1.1895, "step": 17549 }, { "epoch": 0.48, "learning_rate": 1.1154356208003667e-05, "loss": 1.292, "step": 17550 }, { "epoch": 0.48, "learning_rate": 1.1153477609257246e-05, "loss": 1.2236, "step": 17551 }, { "epoch": 0.48, "learning_rate": 1.1152599001486564e-05, "loss": 1.3745, "step": 17552 }, { "epoch": 0.48, "learning_rate": 1.1151720384698483e-05, "loss": 1.2354, "step": 17553 }, { "epoch": 0.48, "learning_rate": 1.1150841758899888e-05, "loss": 1.2893, "step": 17554 }, { "epoch": 0.48, "learning_rate": 1.1149963124097644e-05, "loss": 1.187, "step": 17555 }, { "epoch": 0.48, "learning_rate": 1.1149084480298636e-05, "loss": 1.2046, "step": 17556 }, { "epoch": 0.48, "learning_rate": 1.1148205827509724e-05, "loss": 1.335, "step": 17557 }, { "epoch": 0.48, "learning_rate": 1.1147327165737793e-05, "loss": 1.3967, "step": 17558 }, { "epoch": 0.48, "learning_rate": 1.1146448494989715e-05, "loss": 1.3298, "step": 17559 }, { "epoch": 0.48, "learning_rate": 1.1145569815272362e-05, "loss": 1.4004, "step": 17560 }, { "epoch": 0.48, "learning_rate": 1.1144691126592608e-05, "loss": 1.2583, "step": 17561 }, { "epoch": 0.48, "learning_rate": 1.114381242895733e-05, "loss": 1.3989, "step": 17562 }, { "epoch": 0.48, "learning_rate": 1.1142933722373399e-05, "loss": 1.3237, "step": 17563 }, { "epoch": 0.48, "learning_rate": 1.1142055006847694e-05, "loss": 1.2524, "step": 17564 }, { "epoch": 0.48, "learning_rate": 1.1141176282387087e-05, "loss": 1.3372, "step": 17565 }, { "epoch": 0.48, "learning_rate": 1.1140297548998456e-05, "loss": 1.208, "step": 17566 }, { "epoch": 0.48, "learning_rate": 1.1139418806688671e-05, "loss": 1.3533, "step": 17567 }, { "epoch": 0.48, "learning_rate": 1.1138540055464611e-05, "loss": 1.1907, "step": 17568 }, { "epoch": 0.48, "learning_rate": 1.1137661295333147e-05, "loss": 1.3853, "step": 17569 }, { "epoch": 0.48, "learning_rate": 1.1136782526301158e-05, "loss": 1.3701, "step": 17570 }, { "epoch": 0.48, "learning_rate": 1.1135903748375514e-05, "loss": 1.2168, "step": 17571 }, { "epoch": 0.48, "learning_rate": 1.1135024961563094e-05, "loss": 1.1838, "step": 17572 }, { "epoch": 0.48, "learning_rate": 1.1134146165870774e-05, "loss": 1.2727, "step": 17573 }, { "epoch": 0.48, "learning_rate": 1.1133267361305426e-05, "loss": 1.0929, "step": 17574 }, { "epoch": 0.48, "learning_rate": 1.1132388547873928e-05, "loss": 1.4045, "step": 17575 }, { "epoch": 0.48, "learning_rate": 1.1131509725583156e-05, "loss": 1.7603, "step": 17576 }, { "epoch": 0.48, "learning_rate": 1.113063089443998e-05, "loss": 1.2222, "step": 17577 }, { "epoch": 0.48, "learning_rate": 1.1129752054451284e-05, "loss": 1.167, "step": 17578 }, { "epoch": 0.48, "learning_rate": 1.1128873205623933e-05, "loss": 1.2351, "step": 17579 }, { "epoch": 0.48, "learning_rate": 1.1127994347964814e-05, "loss": 1.2778, "step": 17580 }, { "epoch": 0.48, "learning_rate": 1.1127115481480797e-05, "loss": 1.3389, "step": 17581 }, { "epoch": 0.48, "learning_rate": 1.112623660617876e-05, "loss": 1.3689, "step": 17582 }, { "epoch": 0.48, "learning_rate": 1.1125357722065573e-05, "loss": 1.3149, "step": 17583 }, { "epoch": 0.48, "learning_rate": 1.1124478829148119e-05, "loss": 1.2739, "step": 17584 }, { "epoch": 0.48, "learning_rate": 1.1123599927433273e-05, "loss": 1.189, "step": 17585 }, { "epoch": 0.48, "learning_rate": 1.1122721016927908e-05, "loss": 1.3245, "step": 17586 }, { "epoch": 0.48, "learning_rate": 1.11218420976389e-05, "loss": 1.2469, "step": 17587 }, { "epoch": 0.48, "learning_rate": 1.1120963169573131e-05, "loss": 1.1589, "step": 17588 }, { "epoch": 0.48, "learning_rate": 1.112008423273747e-05, "loss": 1.2832, "step": 17589 }, { "epoch": 0.48, "learning_rate": 1.1119205287138796e-05, "loss": 1.2981, "step": 17590 }, { "epoch": 0.48, "learning_rate": 1.111832633278399e-05, "loss": 1.353, "step": 17591 }, { "epoch": 0.48, "learning_rate": 1.1117447369679922e-05, "loss": 1.313, "step": 17592 }, { "epoch": 0.48, "learning_rate": 1.111656839783347e-05, "loss": 1.2329, "step": 17593 }, { "epoch": 0.48, "learning_rate": 1.1115689417251512e-05, "loss": 1.2505, "step": 17594 }, { "epoch": 0.48, "learning_rate": 1.1114810427940928e-05, "loss": 1.3462, "step": 17595 }, { "epoch": 0.48, "learning_rate": 1.111393142990859e-05, "loss": 1.3535, "step": 17596 }, { "epoch": 0.48, "learning_rate": 1.1113052423161374e-05, "loss": 1.1812, "step": 17597 }, { "epoch": 0.48, "learning_rate": 1.1112173407706161e-05, "loss": 1.3591, "step": 17598 }, { "epoch": 0.48, "learning_rate": 1.1111294383549827e-05, "loss": 1.3247, "step": 17599 }, { "epoch": 0.48, "learning_rate": 1.1110415350699246e-05, "loss": 1.3396, "step": 17600 }, { "epoch": 0.48, "learning_rate": 1.11095363091613e-05, "loss": 1.3616, "step": 17601 }, { "epoch": 0.48, "learning_rate": 1.1108657258942861e-05, "loss": 1.2993, "step": 17602 }, { "epoch": 0.48, "learning_rate": 1.1107778200050812e-05, "loss": 1.4817, "step": 17603 }, { "epoch": 0.48, "learning_rate": 1.1106899132492025e-05, "loss": 1.3538, "step": 17604 }, { "epoch": 0.48, "learning_rate": 1.110602005627338e-05, "loss": 1.384, "step": 17605 }, { "epoch": 0.48, "learning_rate": 1.1105140971401756e-05, "loss": 1.2356, "step": 17606 }, { "epoch": 0.48, "learning_rate": 1.1104261877884028e-05, "loss": 1.4055, "step": 17607 }, { "epoch": 0.48, "learning_rate": 1.1103382775727071e-05, "loss": 1.3691, "step": 17608 }, { "epoch": 0.48, "learning_rate": 1.1102503664937771e-05, "loss": 1.3865, "step": 17609 }, { "epoch": 0.48, "learning_rate": 1.1101624545522996e-05, "loss": 1.3682, "step": 17610 }, { "epoch": 0.48, "learning_rate": 1.1100745417489631e-05, "loss": 1.3135, "step": 17611 }, { "epoch": 0.48, "learning_rate": 1.1099866280844552e-05, "loss": 1.4644, "step": 17612 }, { "epoch": 0.48, "learning_rate": 1.1098987135594636e-05, "loss": 1.3926, "step": 17613 }, { "epoch": 0.48, "learning_rate": 1.1098107981746762e-05, "loss": 1.353, "step": 17614 }, { "epoch": 0.48, "learning_rate": 1.1097228819307808e-05, "loss": 1.3416, "step": 17615 }, { "epoch": 0.48, "learning_rate": 1.1096349648284648e-05, "loss": 1.1519, "step": 17616 }, { "epoch": 0.48, "learning_rate": 1.1095470468684169e-05, "loss": 1.4175, "step": 17617 }, { "epoch": 0.48, "learning_rate": 1.109459128051324e-05, "loss": 1.3677, "step": 17618 }, { "epoch": 0.48, "learning_rate": 1.1093712083778748e-05, "loss": 1.3281, "step": 17619 }, { "epoch": 0.48, "learning_rate": 1.109283287848756e-05, "loss": 1.3464, "step": 17620 }, { "epoch": 0.48, "learning_rate": 1.1091953664646569e-05, "loss": 1.1521, "step": 17621 }, { "epoch": 0.48, "learning_rate": 1.1091074442262641e-05, "loss": 1.239, "step": 17622 }, { "epoch": 0.48, "learning_rate": 1.1090195211342663e-05, "loss": 1.3125, "step": 17623 }, { "epoch": 0.48, "learning_rate": 1.1089315971893507e-05, "loss": 1.2268, "step": 17624 }, { "epoch": 0.48, "learning_rate": 1.1088436723922054e-05, "loss": 1.2839, "step": 17625 }, { "epoch": 0.48, "learning_rate": 1.1087557467435186e-05, "loss": 1.3069, "step": 17626 }, { "epoch": 0.48, "learning_rate": 1.1086678202439782e-05, "loss": 1.1514, "step": 17627 }, { "epoch": 0.48, "learning_rate": 1.1085798928942715e-05, "loss": 1.2307, "step": 17628 }, { "epoch": 0.48, "learning_rate": 1.1084919646950871e-05, "loss": 1.3254, "step": 17629 }, { "epoch": 0.48, "learning_rate": 1.1084040356471124e-05, "loss": 1.28, "step": 17630 }, { "epoch": 0.48, "learning_rate": 1.1083161057510357e-05, "loss": 1.2644, "step": 17631 }, { "epoch": 0.48, "learning_rate": 1.1082281750075446e-05, "loss": 1.3018, "step": 17632 }, { "epoch": 0.48, "learning_rate": 1.1081402434173272e-05, "loss": 1.3787, "step": 17633 }, { "epoch": 0.48, "learning_rate": 1.108052310981071e-05, "loss": 1.1902, "step": 17634 }, { "epoch": 0.48, "learning_rate": 1.1079643776994648e-05, "loss": 1.3354, "step": 17635 }, { "epoch": 0.48, "learning_rate": 1.1078764435731959e-05, "loss": 1.2202, "step": 17636 }, { "epoch": 0.48, "learning_rate": 1.1077885086029525e-05, "loss": 1.2859, "step": 17637 }, { "epoch": 0.48, "learning_rate": 1.1077005727894224e-05, "loss": 1.4094, "step": 17638 }, { "epoch": 0.48, "learning_rate": 1.1076126361332937e-05, "loss": 1.3154, "step": 17639 }, { "epoch": 0.48, "learning_rate": 1.1075246986352543e-05, "loss": 1.2939, "step": 17640 }, { "epoch": 0.48, "learning_rate": 1.1074367602959924e-05, "loss": 1.3472, "step": 17641 }, { "epoch": 0.48, "learning_rate": 1.1073488211161955e-05, "loss": 1.262, "step": 17642 }, { "epoch": 0.48, "learning_rate": 1.1072608810965522e-05, "loss": 1.1899, "step": 17643 }, { "epoch": 0.48, "learning_rate": 1.10717294023775e-05, "loss": 1.2039, "step": 17644 }, { "epoch": 0.48, "learning_rate": 1.1070849985404773e-05, "loss": 1.2202, "step": 17645 }, { "epoch": 0.48, "learning_rate": 1.106997056005422e-05, "loss": 1.3918, "step": 17646 }, { "epoch": 0.48, "learning_rate": 1.1069091126332717e-05, "loss": 1.4368, "step": 17647 }, { "epoch": 0.48, "learning_rate": 1.106821168424715e-05, "loss": 1.2114, "step": 17648 }, { "epoch": 0.48, "learning_rate": 1.1067332233804396e-05, "loss": 1.3486, "step": 17649 }, { "epoch": 0.48, "learning_rate": 1.1066452775011339e-05, "loss": 1.1992, "step": 17650 }, { "epoch": 0.48, "learning_rate": 1.1065573307874852e-05, "loss": 1.3137, "step": 17651 }, { "epoch": 0.48, "learning_rate": 1.1064693832401825e-05, "loss": 1.6455, "step": 17652 }, { "epoch": 0.48, "learning_rate": 1.106381434859913e-05, "loss": 1.3782, "step": 17653 }, { "epoch": 0.48, "learning_rate": 1.1062934856473655e-05, "loss": 1.2727, "step": 17654 }, { "epoch": 0.48, "learning_rate": 1.1062055356032277e-05, "loss": 1.2817, "step": 17655 }, { "epoch": 0.48, "learning_rate": 1.1061175847281877e-05, "loss": 1.3083, "step": 17656 }, { "epoch": 0.48, "learning_rate": 1.1060296330229336e-05, "loss": 1.3794, "step": 17657 }, { "epoch": 0.48, "learning_rate": 1.1059416804881535e-05, "loss": 1.416, "step": 17658 }, { "epoch": 0.48, "learning_rate": 1.1058537271245356e-05, "loss": 1.2021, "step": 17659 }, { "epoch": 0.48, "learning_rate": 1.105765772932768e-05, "loss": 1.2092, "step": 17660 }, { "epoch": 0.48, "learning_rate": 1.1056778179135385e-05, "loss": 1.3882, "step": 17661 }, { "epoch": 0.48, "learning_rate": 1.1055898620675355e-05, "loss": 1.269, "step": 17662 }, { "epoch": 0.48, "learning_rate": 1.1055019053954473e-05, "loss": 1.1719, "step": 17663 }, { "epoch": 0.48, "learning_rate": 1.1054139478979615e-05, "loss": 1.2388, "step": 17664 }, { "epoch": 0.48, "learning_rate": 1.1053259895757666e-05, "loss": 1.2695, "step": 17665 }, { "epoch": 0.48, "learning_rate": 1.1052380304295509e-05, "loss": 1.2786, "step": 17666 }, { "epoch": 0.48, "learning_rate": 1.105150070460002e-05, "loss": 1.3352, "step": 17667 }, { "epoch": 0.48, "learning_rate": 1.1050621096678087e-05, "loss": 1.2607, "step": 17668 }, { "epoch": 0.48, "learning_rate": 1.1049741480536586e-05, "loss": 1.2576, "step": 17669 }, { "epoch": 0.48, "learning_rate": 1.1048861856182404e-05, "loss": 1.2119, "step": 17670 }, { "epoch": 0.48, "learning_rate": 1.1047982223622418e-05, "loss": 1.4961, "step": 17671 }, { "epoch": 0.48, "learning_rate": 1.1047102582863512e-05, "loss": 1.2681, "step": 17672 }, { "epoch": 0.48, "learning_rate": 1.1046222933912567e-05, "loss": 1.1824, "step": 17673 }, { "epoch": 0.48, "learning_rate": 1.1045343276776467e-05, "loss": 1.4048, "step": 17674 }, { "epoch": 0.48, "learning_rate": 1.1044463611462093e-05, "loss": 1.2717, "step": 17675 }, { "epoch": 0.48, "learning_rate": 1.1043583937976328e-05, "loss": 1.3606, "step": 17676 }, { "epoch": 0.48, "learning_rate": 1.104270425632605e-05, "loss": 1.4058, "step": 17677 }, { "epoch": 0.48, "learning_rate": 1.1041824566518146e-05, "loss": 1.2295, "step": 17678 }, { "epoch": 0.48, "learning_rate": 1.1040944868559498e-05, "loss": 1.2527, "step": 17679 }, { "epoch": 0.48, "learning_rate": 1.1040065162456986e-05, "loss": 1.1832, "step": 17680 }, { "epoch": 0.48, "learning_rate": 1.103918544821749e-05, "loss": 1.219, "step": 17681 }, { "epoch": 0.48, "learning_rate": 1.10383057258479e-05, "loss": 1.3142, "step": 17682 }, { "epoch": 0.48, "learning_rate": 1.1037425995355091e-05, "loss": 1.5132, "step": 17683 }, { "epoch": 0.48, "learning_rate": 1.1036546256745953e-05, "loss": 1.3933, "step": 17684 }, { "epoch": 0.48, "learning_rate": 1.1035666510027359e-05, "loss": 1.2532, "step": 17685 }, { "epoch": 0.48, "learning_rate": 1.1034786755206202e-05, "loss": 1.1105, "step": 17686 }, { "epoch": 0.48, "learning_rate": 1.1033906992289354e-05, "loss": 1.428, "step": 17687 }, { "epoch": 0.48, "learning_rate": 1.103302722128371e-05, "loss": 1.3127, "step": 17688 }, { "epoch": 0.48, "learning_rate": 1.1032147442196145e-05, "loss": 1.1942, "step": 17689 }, { "epoch": 0.48, "learning_rate": 1.1031267655033541e-05, "loss": 1.1089, "step": 17690 }, { "epoch": 0.48, "learning_rate": 1.1030387859802787e-05, "loss": 1.3018, "step": 17691 }, { "epoch": 0.48, "learning_rate": 1.1029508056510762e-05, "loss": 1.2188, "step": 17692 }, { "epoch": 0.48, "learning_rate": 1.102862824516435e-05, "loss": 1.2964, "step": 17693 }, { "epoch": 0.48, "learning_rate": 1.1027748425770434e-05, "loss": 1.2502, "step": 17694 }, { "epoch": 0.48, "learning_rate": 1.1026868598335899e-05, "loss": 1.1621, "step": 17695 }, { "epoch": 0.48, "learning_rate": 1.1025988762867628e-05, "loss": 1.1836, "step": 17696 }, { "epoch": 0.48, "learning_rate": 1.1025108919372501e-05, "loss": 1.364, "step": 17697 }, { "epoch": 0.48, "learning_rate": 1.1024229067857403e-05, "loss": 1.2107, "step": 17698 }, { "epoch": 0.48, "learning_rate": 1.102334920832922e-05, "loss": 1.4702, "step": 17699 }, { "epoch": 0.48, "learning_rate": 1.1022469340794835e-05, "loss": 1.2292, "step": 17700 }, { "epoch": 0.48, "learning_rate": 1.1021589465261128e-05, "loss": 1.1271, "step": 17701 }, { "epoch": 0.48, "learning_rate": 1.1020709581734987e-05, "loss": 1.3699, "step": 17702 }, { "epoch": 0.48, "learning_rate": 1.1019829690223293e-05, "loss": 1.323, "step": 17703 }, { "epoch": 0.48, "learning_rate": 1.1018949790732932e-05, "loss": 1.4924, "step": 17704 }, { "epoch": 0.48, "learning_rate": 1.1018069883270788e-05, "loss": 1.3286, "step": 17705 }, { "epoch": 0.48, "learning_rate": 1.1017189967843742e-05, "loss": 1.4932, "step": 17706 }, { "epoch": 0.48, "learning_rate": 1.1016310044458683e-05, "loss": 1.1792, "step": 17707 }, { "epoch": 0.48, "learning_rate": 1.1015430113122487e-05, "loss": 1.3291, "step": 17708 }, { "epoch": 0.48, "learning_rate": 1.101455017384205e-05, "loss": 1.2683, "step": 17709 }, { "epoch": 0.48, "learning_rate": 1.1013670226624242e-05, "loss": 1.3308, "step": 17710 }, { "epoch": 0.48, "learning_rate": 1.1012790271475962e-05, "loss": 1.2588, "step": 17711 }, { "epoch": 0.48, "learning_rate": 1.101191030840408e-05, "loss": 1.2705, "step": 17712 }, { "epoch": 0.48, "learning_rate": 1.1011030337415494e-05, "loss": 1.2678, "step": 17713 }, { "epoch": 0.48, "learning_rate": 1.101015035851708e-05, "loss": 1.0801, "step": 17714 }, { "epoch": 0.48, "learning_rate": 1.1009270371715724e-05, "loss": 1.3948, "step": 17715 }, { "epoch": 0.48, "learning_rate": 1.1008390377018309e-05, "loss": 1.395, "step": 17716 }, { "epoch": 0.48, "learning_rate": 1.1007510374431727e-05, "loss": 1.3254, "step": 17717 }, { "epoch": 0.48, "learning_rate": 1.1006630363962854e-05, "loss": 1.3059, "step": 17718 }, { "epoch": 0.48, "learning_rate": 1.1005750345618577e-05, "loss": 1.3462, "step": 17719 }, { "epoch": 0.48, "learning_rate": 1.1004870319405785e-05, "loss": 1.3584, "step": 17720 }, { "epoch": 0.48, "learning_rate": 1.100399028533136e-05, "loss": 1.438, "step": 17721 }, { "epoch": 0.48, "learning_rate": 1.1003110243402187e-05, "loss": 1.3975, "step": 17722 }, { "epoch": 0.48, "learning_rate": 1.100223019362515e-05, "loss": 1.1855, "step": 17723 }, { "epoch": 0.48, "learning_rate": 1.1001350136007136e-05, "loss": 1.3333, "step": 17724 }, { "epoch": 0.48, "learning_rate": 1.100047007055503e-05, "loss": 1.2656, "step": 17725 }, { "epoch": 0.48, "learning_rate": 1.0999589997275715e-05, "loss": 1.3223, "step": 17726 }, { "epoch": 0.48, "learning_rate": 1.099870991617608e-05, "loss": 1.4502, "step": 17727 }, { "epoch": 0.48, "learning_rate": 1.0997829827263006e-05, "loss": 1.2158, "step": 17728 }, { "epoch": 0.48, "learning_rate": 1.0996949730543383e-05, "loss": 1.2783, "step": 17729 }, { "epoch": 0.48, "learning_rate": 1.0996069626024092e-05, "loss": 1.3074, "step": 17730 }, { "epoch": 0.48, "learning_rate": 1.0995189513712024e-05, "loss": 1.3032, "step": 17731 }, { "epoch": 0.48, "learning_rate": 1.0994309393614058e-05, "loss": 1.3264, "step": 17732 }, { "epoch": 0.48, "learning_rate": 1.0993429265737083e-05, "loss": 1.3704, "step": 17733 }, { "epoch": 0.48, "learning_rate": 1.0992549130087983e-05, "loss": 1.323, "step": 17734 }, { "epoch": 0.48, "learning_rate": 1.099166898667365e-05, "loss": 1.1409, "step": 17735 }, { "epoch": 0.48, "learning_rate": 1.099078883550096e-05, "loss": 1.2986, "step": 17736 }, { "epoch": 0.48, "learning_rate": 1.0989908676576808e-05, "loss": 1.4238, "step": 17737 }, { "epoch": 0.48, "learning_rate": 1.0989028509908075e-05, "loss": 1.3037, "step": 17738 }, { "epoch": 0.48, "learning_rate": 1.0988148335501646e-05, "loss": 1.3215, "step": 17739 }, { "epoch": 0.48, "learning_rate": 1.0987268153364412e-05, "loss": 1.3337, "step": 17740 }, { "epoch": 0.48, "learning_rate": 1.0986387963503255e-05, "loss": 1.4062, "step": 17741 }, { "epoch": 0.48, "learning_rate": 1.0985507765925063e-05, "loss": 1.3291, "step": 17742 }, { "epoch": 0.48, "learning_rate": 1.0984627560636722e-05, "loss": 1.2122, "step": 17743 }, { "epoch": 0.48, "learning_rate": 1.0983747347645117e-05, "loss": 1.2415, "step": 17744 }, { "epoch": 0.48, "learning_rate": 1.0982867126957134e-05, "loss": 1.3, "step": 17745 }, { "epoch": 0.48, "learning_rate": 1.0981986898579663e-05, "loss": 1.4409, "step": 17746 }, { "epoch": 0.48, "learning_rate": 1.098110666251959e-05, "loss": 1.3643, "step": 17747 }, { "epoch": 0.48, "learning_rate": 1.0980226418783795e-05, "loss": 1.3394, "step": 17748 }, { "epoch": 0.48, "learning_rate": 1.0979346167379173e-05, "loss": 1.2039, "step": 17749 }, { "epoch": 0.48, "learning_rate": 1.0978465908312606e-05, "loss": 1.3174, "step": 17750 }, { "epoch": 0.48, "learning_rate": 1.097758564159098e-05, "loss": 1.3958, "step": 17751 }, { "epoch": 0.48, "learning_rate": 1.0976705367221185e-05, "loss": 1.2817, "step": 17752 }, { "epoch": 0.48, "learning_rate": 1.0975825085210108e-05, "loss": 1.271, "step": 17753 }, { "epoch": 0.48, "learning_rate": 1.0974944795564633e-05, "loss": 1.1855, "step": 17754 }, { "epoch": 0.48, "learning_rate": 1.0974064498291648e-05, "loss": 1.4685, "step": 17755 }, { "epoch": 0.48, "learning_rate": 1.0973184193398044e-05, "loss": 1.2688, "step": 17756 }, { "epoch": 0.48, "learning_rate": 1.0972303880890697e-05, "loss": 1.3293, "step": 17757 }, { "epoch": 0.48, "learning_rate": 1.0971423560776509e-05, "loss": 1.3564, "step": 17758 }, { "epoch": 0.48, "learning_rate": 1.0970543233062356e-05, "loss": 1.3311, "step": 17759 }, { "epoch": 0.49, "learning_rate": 1.096966289775513e-05, "loss": 1.2637, "step": 17760 }, { "epoch": 0.49, "learning_rate": 1.0968782554861719e-05, "loss": 1.3462, "step": 17761 }, { "epoch": 0.49, "learning_rate": 1.0967902204389007e-05, "loss": 1.366, "step": 17762 }, { "epoch": 0.49, "learning_rate": 1.0967021846343884e-05, "loss": 1.2488, "step": 17763 }, { "epoch": 0.49, "learning_rate": 1.0966141480733236e-05, "loss": 1.4302, "step": 17764 }, { "epoch": 0.49, "learning_rate": 1.096526110756395e-05, "loss": 1.2778, "step": 17765 }, { "epoch": 0.49, "learning_rate": 1.0964380726842917e-05, "loss": 1.344, "step": 17766 }, { "epoch": 0.49, "learning_rate": 1.0963500338577022e-05, "loss": 1.2949, "step": 17767 }, { "epoch": 0.49, "learning_rate": 1.0962619942773157e-05, "loss": 1.3135, "step": 17768 }, { "epoch": 0.49, "learning_rate": 1.0961739539438201e-05, "loss": 1.2305, "step": 17769 }, { "epoch": 0.49, "learning_rate": 1.0960859128579049e-05, "loss": 1.3516, "step": 17770 }, { "epoch": 0.49, "learning_rate": 1.0959978710202588e-05, "loss": 1.1477, "step": 17771 }, { "epoch": 0.49, "learning_rate": 1.0959098284315705e-05, "loss": 1.355, "step": 17772 }, { "epoch": 0.49, "learning_rate": 1.0958217850925285e-05, "loss": 1.4741, "step": 17773 }, { "epoch": 0.49, "learning_rate": 1.0957337410038225e-05, "loss": 1.2476, "step": 17774 }, { "epoch": 0.49, "learning_rate": 1.0956456961661402e-05, "loss": 1.2698, "step": 17775 }, { "epoch": 0.49, "learning_rate": 1.0955576505801711e-05, "loss": 1.1836, "step": 17776 }, { "epoch": 0.49, "learning_rate": 1.0954696042466037e-05, "loss": 1.3831, "step": 17777 }, { "epoch": 0.49, "learning_rate": 1.0953815571661275e-05, "loss": 1.3608, "step": 17778 }, { "epoch": 0.49, "learning_rate": 1.0952935093394304e-05, "loss": 1.1672, "step": 17779 }, { "epoch": 0.49, "learning_rate": 1.095205460767202e-05, "loss": 1.1956, "step": 17780 }, { "epoch": 0.49, "learning_rate": 1.0951174114501304e-05, "loss": 1.3643, "step": 17781 }, { "epoch": 0.49, "learning_rate": 1.0950293613889053e-05, "loss": 1.2754, "step": 17782 }, { "epoch": 0.49, "learning_rate": 1.0949413105842148e-05, "loss": 1.2327, "step": 17783 }, { "epoch": 0.49, "learning_rate": 1.0948532590367486e-05, "loss": 1.3125, "step": 17784 }, { "epoch": 0.49, "learning_rate": 1.0947652067471948e-05, "loss": 1.4636, "step": 17785 }, { "epoch": 0.49, "learning_rate": 1.0946771537162429e-05, "loss": 1.3557, "step": 17786 }, { "epoch": 0.49, "learning_rate": 1.094589099944581e-05, "loss": 1.3245, "step": 17787 }, { "epoch": 0.49, "learning_rate": 1.0945010454328988e-05, "loss": 1.2429, "step": 17788 }, { "epoch": 0.49, "learning_rate": 1.0944129901818847e-05, "loss": 1.3281, "step": 17789 }, { "epoch": 0.49, "learning_rate": 1.0943249341922279e-05, "loss": 1.1672, "step": 17790 }, { "epoch": 0.49, "learning_rate": 1.094236877464617e-05, "loss": 1.4172, "step": 17791 }, { "epoch": 0.49, "learning_rate": 1.0941488199997414e-05, "loss": 1.376, "step": 17792 }, { "epoch": 0.49, "learning_rate": 1.0940607617982893e-05, "loss": 1.321, "step": 17793 }, { "epoch": 0.49, "learning_rate": 1.0939727028609504e-05, "loss": 1.4141, "step": 17794 }, { "epoch": 0.49, "learning_rate": 1.093884643188413e-05, "loss": 1.2825, "step": 17795 }, { "epoch": 0.49, "learning_rate": 1.0937965827813661e-05, "loss": 1.1809, "step": 17796 }, { "epoch": 0.49, "learning_rate": 1.0937085216404993e-05, "loss": 1.2229, "step": 17797 }, { "epoch": 0.49, "learning_rate": 1.0936204597665007e-05, "loss": 1.1289, "step": 17798 }, { "epoch": 0.49, "learning_rate": 1.09353239716006e-05, "loss": 1.2434, "step": 17799 }, { "epoch": 0.49, "learning_rate": 1.0934443338218656e-05, "loss": 1.2942, "step": 17800 }, { "epoch": 0.49, "learning_rate": 1.0933562697526068e-05, "loss": 1.1516, "step": 17801 }, { "epoch": 0.49, "learning_rate": 1.0932682049529723e-05, "loss": 1.3857, "step": 17802 }, { "epoch": 0.49, "learning_rate": 1.0931801394236512e-05, "loss": 1.3806, "step": 17803 }, { "epoch": 0.49, "learning_rate": 1.0930920731653326e-05, "loss": 1.3027, "step": 17804 }, { "epoch": 0.49, "learning_rate": 1.0930040061787055e-05, "loss": 1.3997, "step": 17805 }, { "epoch": 0.49, "learning_rate": 1.0929159384644588e-05, "loss": 1.3291, "step": 17806 }, { "epoch": 0.49, "learning_rate": 1.0928278700232813e-05, "loss": 1.4749, "step": 17807 }, { "epoch": 0.49, "learning_rate": 1.0927398008558623e-05, "loss": 1.2468, "step": 17808 }, { "epoch": 0.49, "learning_rate": 1.0926517309628905e-05, "loss": 1.2026, "step": 17809 }, { "epoch": 0.49, "learning_rate": 1.0925636603450555e-05, "loss": 1.377, "step": 17810 }, { "epoch": 0.49, "learning_rate": 1.0924755890030457e-05, "loss": 1.2888, "step": 17811 }, { "epoch": 0.49, "learning_rate": 1.0923875169375502e-05, "loss": 1.3745, "step": 17812 }, { "epoch": 0.49, "learning_rate": 1.0922994441492587e-05, "loss": 1.048, "step": 17813 }, { "epoch": 0.49, "learning_rate": 1.0922113706388594e-05, "loss": 1.6538, "step": 17814 }, { "epoch": 0.49, "learning_rate": 1.092123296407042e-05, "loss": 1.2727, "step": 17815 }, { "epoch": 0.49, "learning_rate": 1.0920352214544946e-05, "loss": 1.2888, "step": 17816 }, { "epoch": 0.49, "learning_rate": 1.0919471457819077e-05, "loss": 1.1926, "step": 17817 }, { "epoch": 0.49, "learning_rate": 1.091859069389969e-05, "loss": 1.4316, "step": 17818 }, { "epoch": 0.49, "learning_rate": 1.0917709922793685e-05, "loss": 1.3159, "step": 17819 }, { "epoch": 0.49, "learning_rate": 1.0916829144507947e-05, "loss": 1.2598, "step": 17820 }, { "epoch": 0.49, "learning_rate": 1.0915948359049372e-05, "loss": 1.2725, "step": 17821 }, { "epoch": 0.49, "learning_rate": 1.0915067566424841e-05, "loss": 1.3083, "step": 17822 }, { "epoch": 0.49, "learning_rate": 1.091418676664126e-05, "loss": 1.4568, "step": 17823 }, { "epoch": 0.49, "learning_rate": 1.0913305959705505e-05, "loss": 1.2795, "step": 17824 }, { "epoch": 0.49, "learning_rate": 1.0912425145624477e-05, "loss": 1.4875, "step": 17825 }, { "epoch": 0.49, "learning_rate": 1.0911544324405061e-05, "loss": 1.2954, "step": 17826 }, { "epoch": 0.49, "learning_rate": 1.0910663496054152e-05, "loss": 1.269, "step": 17827 }, { "epoch": 0.49, "learning_rate": 1.090978266057864e-05, "loss": 1.3113, "step": 17828 }, { "epoch": 0.49, "learning_rate": 1.0908901817985419e-05, "loss": 1.6704, "step": 17829 }, { "epoch": 0.49, "learning_rate": 1.0908020968281374e-05, "loss": 1.2954, "step": 17830 }, { "epoch": 0.49, "learning_rate": 1.0907140111473402e-05, "loss": 1.2686, "step": 17831 }, { "epoch": 0.49, "learning_rate": 1.0906259247568391e-05, "loss": 1.2595, "step": 17832 }, { "epoch": 0.49, "learning_rate": 1.0905378376573237e-05, "loss": 1.4639, "step": 17833 }, { "epoch": 0.49, "learning_rate": 1.0904497498494824e-05, "loss": 1.3987, "step": 17834 }, { "epoch": 0.49, "learning_rate": 1.090361661334005e-05, "loss": 1.3425, "step": 17835 }, { "epoch": 0.49, "learning_rate": 1.0902735721115805e-05, "loss": 1.3235, "step": 17836 }, { "epoch": 0.49, "learning_rate": 1.0901854821828981e-05, "loss": 1.2717, "step": 17837 }, { "epoch": 0.49, "learning_rate": 1.0900973915486466e-05, "loss": 1.2559, "step": 17838 }, { "epoch": 0.49, "learning_rate": 1.0900093002095158e-05, "loss": 1.4099, "step": 17839 }, { "epoch": 0.49, "learning_rate": 1.0899212081661943e-05, "loss": 1.2808, "step": 17840 }, { "epoch": 0.49, "learning_rate": 1.0898331154193717e-05, "loss": 1.1329, "step": 17841 }, { "epoch": 0.49, "learning_rate": 1.0897450219697367e-05, "loss": 1.1411, "step": 17842 }, { "epoch": 0.49, "learning_rate": 1.0896569278179791e-05, "loss": 1.2363, "step": 17843 }, { "epoch": 0.49, "learning_rate": 1.0895688329647878e-05, "loss": 1.7236, "step": 17844 }, { "epoch": 0.49, "learning_rate": 1.0894807374108522e-05, "loss": 1.2676, "step": 17845 }, { "epoch": 0.49, "learning_rate": 1.0893926411568613e-05, "loss": 1.3435, "step": 17846 }, { "epoch": 0.49, "learning_rate": 1.0893045442035047e-05, "loss": 1.3748, "step": 17847 }, { "epoch": 0.49, "learning_rate": 1.089216446551471e-05, "loss": 1.184, "step": 17848 }, { "epoch": 0.49, "learning_rate": 1.08912834820145e-05, "loss": 1.2756, "step": 17849 }, { "epoch": 0.49, "learning_rate": 1.0890402491541305e-05, "loss": 1.1423, "step": 17850 }, { "epoch": 0.49, "learning_rate": 1.0889521494102022e-05, "loss": 1.1853, "step": 17851 }, { "epoch": 0.49, "learning_rate": 1.0888640489703537e-05, "loss": 1.2666, "step": 17852 }, { "epoch": 0.49, "learning_rate": 1.088775947835275e-05, "loss": 1.3601, "step": 17853 }, { "epoch": 0.49, "learning_rate": 1.0886878460056549e-05, "loss": 1.2695, "step": 17854 }, { "epoch": 0.49, "learning_rate": 1.0885997434821831e-05, "loss": 1.22, "step": 17855 }, { "epoch": 0.49, "learning_rate": 1.0885116402655483e-05, "loss": 1.7339, "step": 17856 }, { "epoch": 0.49, "learning_rate": 1.0884235363564402e-05, "loss": 1.3069, "step": 17857 }, { "epoch": 0.49, "learning_rate": 1.0883354317555477e-05, "loss": 1.3198, "step": 17858 }, { "epoch": 0.49, "learning_rate": 1.0882473264635603e-05, "loss": 1.2324, "step": 17859 }, { "epoch": 0.49, "learning_rate": 1.0881592204811675e-05, "loss": 1.3943, "step": 17860 }, { "epoch": 0.49, "learning_rate": 1.0880711138090583e-05, "loss": 1.1687, "step": 17861 }, { "epoch": 0.49, "learning_rate": 1.0879830064479222e-05, "loss": 1.2417, "step": 17862 }, { "epoch": 0.49, "learning_rate": 1.0878948983984483e-05, "loss": 1.2983, "step": 17863 }, { "epoch": 0.49, "learning_rate": 1.0878067896613262e-05, "loss": 1.2051, "step": 17864 }, { "epoch": 0.49, "learning_rate": 1.087718680237245e-05, "loss": 1.2937, "step": 17865 }, { "epoch": 0.49, "learning_rate": 1.0876305701268941e-05, "loss": 1.2266, "step": 17866 }, { "epoch": 0.49, "learning_rate": 1.0875424593309628e-05, "loss": 1.3291, "step": 17867 }, { "epoch": 0.49, "learning_rate": 1.0874543478501407e-05, "loss": 1.1733, "step": 17868 }, { "epoch": 0.49, "learning_rate": 1.0873662356851164e-05, "loss": 1.4595, "step": 17869 }, { "epoch": 0.49, "learning_rate": 1.0872781228365803e-05, "loss": 1.4814, "step": 17870 }, { "epoch": 0.49, "learning_rate": 1.0871900093052207e-05, "loss": 1.209, "step": 17871 }, { "epoch": 0.49, "learning_rate": 1.087101895091728e-05, "loss": 1.0452, "step": 17872 }, { "epoch": 0.49, "learning_rate": 1.0870137801967907e-05, "loss": 1.3398, "step": 17873 }, { "epoch": 0.49, "learning_rate": 1.0869256646210984e-05, "loss": 1.3069, "step": 17874 }, { "epoch": 0.49, "learning_rate": 1.0868375483653406e-05, "loss": 1.2634, "step": 17875 }, { "epoch": 0.49, "learning_rate": 1.0867494314302069e-05, "loss": 1.2551, "step": 17876 }, { "epoch": 0.49, "learning_rate": 1.0866613138163865e-05, "loss": 1.1863, "step": 17877 }, { "epoch": 0.49, "learning_rate": 1.0865731955245687e-05, "loss": 1.4529, "step": 17878 }, { "epoch": 0.49, "learning_rate": 1.0864850765554424e-05, "loss": 1.3428, "step": 17879 }, { "epoch": 0.49, "learning_rate": 1.0863969569096982e-05, "loss": 1.377, "step": 17880 }, { "epoch": 0.49, "learning_rate": 1.0863088365880245e-05, "loss": 1.4143, "step": 17881 }, { "epoch": 0.49, "learning_rate": 1.0862207155911112e-05, "loss": 1.2253, "step": 17882 }, { "epoch": 0.49, "learning_rate": 1.0861325939196475e-05, "loss": 1.4907, "step": 17883 }, { "epoch": 0.49, "learning_rate": 1.0860444715743227e-05, "loss": 1.3826, "step": 17884 }, { "epoch": 0.49, "learning_rate": 1.0859563485558266e-05, "loss": 1.2842, "step": 17885 }, { "epoch": 0.49, "learning_rate": 1.0858682248648487e-05, "loss": 1.4131, "step": 17886 }, { "epoch": 0.49, "learning_rate": 1.0857801005020777e-05, "loss": 1.3699, "step": 17887 }, { "epoch": 0.49, "learning_rate": 1.0856919754682037e-05, "loss": 1.2903, "step": 17888 }, { "epoch": 0.49, "learning_rate": 1.085603849763916e-05, "loss": 1.3455, "step": 17889 }, { "epoch": 0.49, "learning_rate": 1.085515723389904e-05, "loss": 1.2471, "step": 17890 }, { "epoch": 0.49, "learning_rate": 1.0854275963468572e-05, "loss": 1.3149, "step": 17891 }, { "epoch": 0.49, "learning_rate": 1.0853394686354653e-05, "loss": 1.3779, "step": 17892 }, { "epoch": 0.49, "learning_rate": 1.085251340256417e-05, "loss": 1.375, "step": 17893 }, { "epoch": 0.49, "learning_rate": 1.0851632112104028e-05, "loss": 1.4563, "step": 17894 }, { "epoch": 0.49, "learning_rate": 1.0850750814981115e-05, "loss": 1.3105, "step": 17895 }, { "epoch": 0.49, "learning_rate": 1.0849869511202328e-05, "loss": 1.2507, "step": 17896 }, { "epoch": 0.49, "learning_rate": 1.0848988200774562e-05, "loss": 1.4358, "step": 17897 }, { "epoch": 0.49, "learning_rate": 1.0848106883704712e-05, "loss": 1.3201, "step": 17898 }, { "epoch": 0.49, "learning_rate": 1.084722555999967e-05, "loss": 1.2515, "step": 17899 }, { "epoch": 0.49, "learning_rate": 1.0846344229666336e-05, "loss": 1.6646, "step": 17900 }, { "epoch": 0.49, "learning_rate": 1.08454628927116e-05, "loss": 1.1379, "step": 17901 }, { "epoch": 0.49, "learning_rate": 1.0844581549142364e-05, "loss": 1.4199, "step": 17902 }, { "epoch": 0.49, "learning_rate": 1.0843700198965514e-05, "loss": 1.1614, "step": 17903 }, { "epoch": 0.49, "learning_rate": 1.0842818842187956e-05, "loss": 1.3069, "step": 17904 }, { "epoch": 0.49, "learning_rate": 1.0841937478816575e-05, "loss": 1.4216, "step": 17905 }, { "epoch": 0.49, "learning_rate": 1.0841056108858272e-05, "loss": 1.3711, "step": 17906 }, { "epoch": 0.49, "learning_rate": 1.0840174732319943e-05, "loss": 1.3052, "step": 17907 }, { "epoch": 0.49, "learning_rate": 1.0839293349208481e-05, "loss": 1.2148, "step": 17908 }, { "epoch": 0.49, "learning_rate": 1.0838411959530786e-05, "loss": 1.2549, "step": 17909 }, { "epoch": 0.49, "learning_rate": 1.0837530563293745e-05, "loss": 1.1946, "step": 17910 }, { "epoch": 0.49, "learning_rate": 1.0836649160504263e-05, "loss": 1.3679, "step": 17911 }, { "epoch": 0.49, "learning_rate": 1.0835767751169226e-05, "loss": 1.2861, "step": 17912 }, { "epoch": 0.49, "learning_rate": 1.083488633529554e-05, "loss": 1.2593, "step": 17913 }, { "epoch": 0.49, "learning_rate": 1.0834004912890092e-05, "loss": 1.3408, "step": 17914 }, { "epoch": 0.49, "learning_rate": 1.0833123483959787e-05, "loss": 1.3301, "step": 17915 }, { "epoch": 0.49, "learning_rate": 1.0832242048511512e-05, "loss": 1.4209, "step": 17916 }, { "epoch": 0.49, "learning_rate": 1.0831360606552169e-05, "loss": 1.1726, "step": 17917 }, { "epoch": 0.49, "learning_rate": 1.0830479158088647e-05, "loss": 1.3044, "step": 17918 }, { "epoch": 0.49, "learning_rate": 1.0829597703127847e-05, "loss": 1.3386, "step": 17919 }, { "epoch": 0.49, "learning_rate": 1.0828716241676666e-05, "loss": 1.252, "step": 17920 }, { "epoch": 0.49, "learning_rate": 1.0827834773742003e-05, "loss": 1.4653, "step": 17921 }, { "epoch": 0.49, "learning_rate": 1.0826953299330745e-05, "loss": 1.3149, "step": 17922 }, { "epoch": 0.49, "learning_rate": 1.0826071818449797e-05, "loss": 1.3965, "step": 17923 }, { "epoch": 0.49, "learning_rate": 1.0825190331106048e-05, "loss": 1.1763, "step": 17924 }, { "epoch": 0.49, "learning_rate": 1.0824308837306401e-05, "loss": 1.3774, "step": 17925 }, { "epoch": 0.49, "learning_rate": 1.0823427337057746e-05, "loss": 1.345, "step": 17926 }, { "epoch": 0.49, "learning_rate": 1.0822545830366986e-05, "loss": 1.2397, "step": 17927 }, { "epoch": 0.49, "learning_rate": 1.0821664317241011e-05, "loss": 1.241, "step": 17928 }, { "epoch": 0.49, "learning_rate": 1.0820782797686724e-05, "loss": 1.3589, "step": 17929 }, { "epoch": 0.49, "learning_rate": 1.0819901271711016e-05, "loss": 1.3313, "step": 17930 }, { "epoch": 0.49, "learning_rate": 1.0819019739320786e-05, "loss": 1.437, "step": 17931 }, { "epoch": 0.49, "learning_rate": 1.0818138200522932e-05, "loss": 1.2305, "step": 17932 }, { "epoch": 0.49, "learning_rate": 1.0817256655324348e-05, "loss": 1.1738, "step": 17933 }, { "epoch": 0.49, "learning_rate": 1.0816375103731933e-05, "loss": 1.3589, "step": 17934 }, { "epoch": 0.49, "learning_rate": 1.0815493545752585e-05, "loss": 1.3955, "step": 17935 }, { "epoch": 0.49, "learning_rate": 1.0814611981393193e-05, "loss": 1.23, "step": 17936 }, { "epoch": 0.49, "learning_rate": 1.0813730410660665e-05, "loss": 1.3108, "step": 17937 }, { "epoch": 0.49, "learning_rate": 1.0812848833561892e-05, "loss": 1.2603, "step": 17938 }, { "epoch": 0.49, "learning_rate": 1.0811967250103771e-05, "loss": 1.1528, "step": 17939 }, { "epoch": 0.49, "learning_rate": 1.0811085660293202e-05, "loss": 1.312, "step": 17940 }, { "epoch": 0.49, "learning_rate": 1.081020406413708e-05, "loss": 1.3381, "step": 17941 }, { "epoch": 0.49, "learning_rate": 1.08093224616423e-05, "loss": 1.3528, "step": 17942 }, { "epoch": 0.49, "learning_rate": 1.0808440852815764e-05, "loss": 1.3411, "step": 17943 }, { "epoch": 0.49, "learning_rate": 1.0807559237664364e-05, "loss": 1.2051, "step": 17944 }, { "epoch": 0.49, "learning_rate": 1.0806677616195005e-05, "loss": 1.1105, "step": 17945 }, { "epoch": 0.49, "learning_rate": 1.0805795988414576e-05, "loss": 1.4194, "step": 17946 }, { "epoch": 0.49, "learning_rate": 1.0804914354329981e-05, "loss": 1.28, "step": 17947 }, { "epoch": 0.49, "learning_rate": 1.0804032713948111e-05, "loss": 1.509, "step": 17948 }, { "epoch": 0.49, "learning_rate": 1.0803151067275869e-05, "loss": 1.3169, "step": 17949 }, { "epoch": 0.49, "learning_rate": 1.080226941432015e-05, "loss": 1.1482, "step": 17950 }, { "epoch": 0.49, "learning_rate": 1.080138775508785e-05, "loss": 1.6997, "step": 17951 }, { "epoch": 0.49, "learning_rate": 1.0800506089585873e-05, "loss": 1.2244, "step": 17952 }, { "epoch": 0.49, "learning_rate": 1.0799624417821114e-05, "loss": 0.9913, "step": 17953 }, { "epoch": 0.49, "learning_rate": 1.0798742739800465e-05, "loss": 1.2935, "step": 17954 }, { "epoch": 0.49, "learning_rate": 1.0797861055530832e-05, "loss": 1.2803, "step": 17955 }, { "epoch": 0.49, "learning_rate": 1.0796979365019107e-05, "loss": 1.2673, "step": 17956 }, { "epoch": 0.49, "learning_rate": 1.0796097668272192e-05, "loss": 1.3542, "step": 17957 }, { "epoch": 0.49, "learning_rate": 1.079521596529698e-05, "loss": 1.4922, "step": 17958 }, { "epoch": 0.49, "learning_rate": 1.0794334256100378e-05, "loss": 1.1331, "step": 17959 }, { "epoch": 0.49, "learning_rate": 1.0793452540689273e-05, "loss": 1.4521, "step": 17960 }, { "epoch": 0.49, "learning_rate": 1.0792570819070572e-05, "loss": 1.3972, "step": 17961 }, { "epoch": 0.49, "learning_rate": 1.0791689091251168e-05, "loss": 1.2498, "step": 17962 }, { "epoch": 0.49, "learning_rate": 1.079080735723796e-05, "loss": 1.3064, "step": 17963 }, { "epoch": 0.49, "learning_rate": 1.0789925617037847e-05, "loss": 1.3892, "step": 17964 }, { "epoch": 0.49, "learning_rate": 1.078904387065773e-05, "loss": 1.2874, "step": 17965 }, { "epoch": 0.49, "learning_rate": 1.0788162118104501e-05, "loss": 1.2424, "step": 17966 }, { "epoch": 0.49, "learning_rate": 1.0787280359385064e-05, "loss": 1.262, "step": 17967 }, { "epoch": 0.49, "learning_rate": 1.0786398594506317e-05, "loss": 1.1797, "step": 17968 }, { "epoch": 0.49, "learning_rate": 1.0785516823475156e-05, "loss": 1.3267, "step": 17969 }, { "epoch": 0.49, "learning_rate": 1.0784635046298481e-05, "loss": 1.2441, "step": 17970 }, { "epoch": 0.49, "learning_rate": 1.078375326298319e-05, "loss": 1.3477, "step": 17971 }, { "epoch": 0.49, "learning_rate": 1.0782871473536184e-05, "loss": 1.4116, "step": 17972 }, { "epoch": 0.49, "learning_rate": 1.0781989677964355e-05, "loss": 1.2798, "step": 17973 }, { "epoch": 0.49, "learning_rate": 1.078110787627461e-05, "loss": 1.2397, "step": 17974 }, { "epoch": 0.49, "learning_rate": 1.0780226068473845e-05, "loss": 1.2153, "step": 17975 }, { "epoch": 0.49, "learning_rate": 1.0779344254568958e-05, "loss": 1.2117, "step": 17976 }, { "epoch": 0.49, "learning_rate": 1.0778462434566845e-05, "loss": 1.2043, "step": 17977 }, { "epoch": 0.49, "learning_rate": 1.0777580608474412e-05, "loss": 1.4976, "step": 17978 }, { "epoch": 0.49, "learning_rate": 1.0776698776298548e-05, "loss": 1.2405, "step": 17979 }, { "epoch": 0.49, "learning_rate": 1.0775816938046165e-05, "loss": 1.2791, "step": 17980 }, { "epoch": 0.49, "learning_rate": 1.077493509372415e-05, "loss": 1.3499, "step": 17981 }, { "epoch": 0.49, "learning_rate": 1.0774053243339408e-05, "loss": 1.3237, "step": 17982 }, { "epoch": 0.49, "learning_rate": 1.0773171386898837e-05, "loss": 1.334, "step": 17983 }, { "epoch": 0.49, "learning_rate": 1.0772289524409341e-05, "loss": 1.3872, "step": 17984 }, { "epoch": 0.49, "learning_rate": 1.077140765587781e-05, "loss": 1.196, "step": 17985 }, { "epoch": 0.49, "learning_rate": 1.0770525781311152e-05, "loss": 1.2319, "step": 17986 }, { "epoch": 0.49, "learning_rate": 1.076964390071626e-05, "loss": 1.3088, "step": 17987 }, { "epoch": 0.49, "learning_rate": 1.0768762014100038e-05, "loss": 1.2751, "step": 17988 }, { "epoch": 0.49, "learning_rate": 1.076788012146938e-05, "loss": 1.377, "step": 17989 }, { "epoch": 0.49, "learning_rate": 1.0766998222831195e-05, "loss": 1.2476, "step": 17990 }, { "epoch": 0.49, "learning_rate": 1.0766116318192372e-05, "loss": 1.3354, "step": 17991 }, { "epoch": 0.49, "learning_rate": 1.0765234407559817e-05, "loss": 1.0394, "step": 17992 }, { "epoch": 0.49, "learning_rate": 1.0764352490940427e-05, "loss": 1.1331, "step": 17993 }, { "epoch": 0.49, "learning_rate": 1.0763470568341104e-05, "loss": 1.2905, "step": 17994 }, { "epoch": 0.49, "learning_rate": 1.0762588639768743e-05, "loss": 1.2805, "step": 17995 }, { "epoch": 0.49, "learning_rate": 1.076170670523025e-05, "loss": 1.3025, "step": 17996 }, { "epoch": 0.49, "learning_rate": 1.076082476473252e-05, "loss": 1.3584, "step": 17997 }, { "epoch": 0.49, "learning_rate": 1.0759942818282454e-05, "loss": 1.3394, "step": 17998 }, { "epoch": 0.49, "learning_rate": 1.0759060865886954e-05, "loss": 1.3457, "step": 17999 }, { "epoch": 0.49, "learning_rate": 1.075817890755292e-05, "loss": 1.3169, "step": 18000 }, { "epoch": 0.49, "learning_rate": 1.0757296943287247e-05, "loss": 1.3491, "step": 18001 }, { "epoch": 0.49, "learning_rate": 1.0756414973096845e-05, "loss": 1.3857, "step": 18002 }, { "epoch": 0.49, "learning_rate": 1.0755532996988602e-05, "loss": 1.3901, "step": 18003 }, { "epoch": 0.49, "learning_rate": 1.0754651014969428e-05, "loss": 1.0857, "step": 18004 }, { "epoch": 0.49, "learning_rate": 1.075376902704622e-05, "loss": 1.2107, "step": 18005 }, { "epoch": 0.49, "learning_rate": 1.0752887033225876e-05, "loss": 1.3894, "step": 18006 }, { "epoch": 0.49, "learning_rate": 1.0752005033515296e-05, "loss": 1.2288, "step": 18007 }, { "epoch": 0.49, "learning_rate": 1.0751123027921385e-05, "loss": 1.2629, "step": 18008 }, { "epoch": 0.49, "learning_rate": 1.0750241016451038e-05, "loss": 1.3594, "step": 18009 }, { "epoch": 0.49, "learning_rate": 1.0749358999111161e-05, "loss": 1.2361, "step": 18010 }, { "epoch": 0.49, "learning_rate": 1.0748476975908647e-05, "loss": 1.2063, "step": 18011 }, { "epoch": 0.49, "learning_rate": 1.0747594946850409e-05, "loss": 1.2114, "step": 18012 }, { "epoch": 0.49, "learning_rate": 1.0746712911943331e-05, "loss": 1.2349, "step": 18013 }, { "epoch": 0.49, "learning_rate": 1.0745830871194327e-05, "loss": 1.3354, "step": 18014 }, { "epoch": 0.49, "learning_rate": 1.0744948824610293e-05, "loss": 1.3328, "step": 18015 }, { "epoch": 0.49, "learning_rate": 1.0744066772198128e-05, "loss": 1.1721, "step": 18016 }, { "epoch": 0.49, "learning_rate": 1.0743184713964736e-05, "loss": 1.0164, "step": 18017 }, { "epoch": 0.49, "learning_rate": 1.0742302649917014e-05, "loss": 1.1794, "step": 18018 }, { "epoch": 0.49, "learning_rate": 1.0741420580061867e-05, "loss": 1.2878, "step": 18019 }, { "epoch": 0.49, "learning_rate": 1.0740538504406193e-05, "loss": 1.366, "step": 18020 }, { "epoch": 0.49, "learning_rate": 1.0739656422956896e-05, "loss": 1.3181, "step": 18021 }, { "epoch": 0.49, "learning_rate": 1.0738774335720873e-05, "loss": 1.2756, "step": 18022 }, { "epoch": 0.49, "learning_rate": 1.0737892242705028e-05, "loss": 1.2874, "step": 18023 }, { "epoch": 0.49, "learning_rate": 1.073701014391626e-05, "loss": 1.2468, "step": 18024 }, { "epoch": 0.49, "learning_rate": 1.0736128039361472e-05, "loss": 1.2192, "step": 18025 }, { "epoch": 0.49, "learning_rate": 1.0735245929047564e-05, "loss": 1.2294, "step": 18026 }, { "epoch": 0.49, "learning_rate": 1.073436381298144e-05, "loss": 1.2656, "step": 18027 }, { "epoch": 0.49, "learning_rate": 1.0733481691169996e-05, "loss": 1.2063, "step": 18028 }, { "epoch": 0.49, "learning_rate": 1.0732599563620136e-05, "loss": 1.3511, "step": 18029 }, { "epoch": 0.49, "learning_rate": 1.0731717430338762e-05, "loss": 1.3208, "step": 18030 }, { "epoch": 0.49, "learning_rate": 1.0730835291332776e-05, "loss": 1.3176, "step": 18031 }, { "epoch": 0.49, "learning_rate": 1.0729953146609076e-05, "loss": 1.3091, "step": 18032 }, { "epoch": 0.49, "learning_rate": 1.0729070996174568e-05, "loss": 1.2983, "step": 18033 }, { "epoch": 0.49, "learning_rate": 1.072818884003615e-05, "loss": 1.4519, "step": 18034 }, { "epoch": 0.49, "learning_rate": 1.0727306678200727e-05, "loss": 1.3652, "step": 18035 }, { "epoch": 0.49, "learning_rate": 1.0726424510675195e-05, "loss": 1.2419, "step": 18036 }, { "epoch": 0.49, "learning_rate": 1.0725542337466463e-05, "loss": 1.1833, "step": 18037 }, { "epoch": 0.49, "learning_rate": 1.0724660158581429e-05, "loss": 1.3511, "step": 18038 }, { "epoch": 0.49, "learning_rate": 1.0723777974026992e-05, "loss": 1.2227, "step": 18039 }, { "epoch": 0.49, "learning_rate": 1.0722895783810057e-05, "loss": 1.2576, "step": 18040 }, { "epoch": 0.49, "learning_rate": 1.0722013587937528e-05, "loss": 1.228, "step": 18041 }, { "epoch": 0.49, "learning_rate": 1.0721131386416301e-05, "loss": 1.3735, "step": 18042 }, { "epoch": 0.49, "learning_rate": 1.0720249179253283e-05, "loss": 1.3079, "step": 18043 }, { "epoch": 0.49, "learning_rate": 1.0719366966455368e-05, "loss": 1.3379, "step": 18044 }, { "epoch": 0.49, "learning_rate": 1.0718484748029472e-05, "loss": 1.3701, "step": 18045 }, { "epoch": 0.49, "learning_rate": 1.0717602523982487e-05, "loss": 1.3682, "step": 18046 }, { "epoch": 0.49, "learning_rate": 1.0716720294321316e-05, "loss": 1.1134, "step": 18047 }, { "epoch": 0.49, "learning_rate": 1.0715838059052863e-05, "loss": 1.3037, "step": 18048 }, { "epoch": 0.49, "learning_rate": 1.0714955818184032e-05, "loss": 1.2166, "step": 18049 }, { "epoch": 0.49, "learning_rate": 1.0714073571721719e-05, "loss": 1.1467, "step": 18050 }, { "epoch": 0.49, "learning_rate": 1.0713191319672833e-05, "loss": 1.2961, "step": 18051 }, { "epoch": 0.49, "learning_rate": 1.0712309062044273e-05, "loss": 1.3547, "step": 18052 }, { "epoch": 0.49, "learning_rate": 1.0711426798842944e-05, "loss": 1.4448, "step": 18053 }, { "epoch": 0.49, "learning_rate": 1.0710544530075741e-05, "loss": 1.4043, "step": 18054 }, { "epoch": 0.49, "learning_rate": 1.0709662255749575e-05, "loss": 1.2424, "step": 18055 }, { "epoch": 0.49, "learning_rate": 1.0708779975871343e-05, "loss": 1.2993, "step": 18056 }, { "epoch": 0.49, "learning_rate": 1.0707897690447953e-05, "loss": 1.1453, "step": 18057 }, { "epoch": 0.49, "learning_rate": 1.0707015399486302e-05, "loss": 1.3147, "step": 18058 }, { "epoch": 0.49, "learning_rate": 1.0706133102993297e-05, "loss": 1.3438, "step": 18059 }, { "epoch": 0.49, "learning_rate": 1.0705250800975838e-05, "loss": 1.386, "step": 18060 }, { "epoch": 0.49, "learning_rate": 1.0704368493440825e-05, "loss": 1.2258, "step": 18061 }, { "epoch": 0.49, "learning_rate": 1.0703486180395168e-05, "loss": 1.1409, "step": 18062 }, { "epoch": 0.49, "learning_rate": 1.0702603861845764e-05, "loss": 1.2551, "step": 18063 }, { "epoch": 0.49, "learning_rate": 1.070172153779952e-05, "loss": 1.2158, "step": 18064 }, { "epoch": 0.49, "learning_rate": 1.0700839208263334e-05, "loss": 1.2371, "step": 18065 }, { "epoch": 0.49, "learning_rate": 1.0699956873244111e-05, "loss": 1.4602, "step": 18066 }, { "epoch": 0.49, "learning_rate": 1.0699074532748756e-05, "loss": 1.3408, "step": 18067 }, { "epoch": 0.49, "learning_rate": 1.069819218678417e-05, "loss": 1.2224, "step": 18068 }, { "epoch": 0.49, "learning_rate": 1.0697309835357262e-05, "loss": 1.1741, "step": 18069 }, { "epoch": 0.49, "learning_rate": 1.0696427478474923e-05, "loss": 1.1423, "step": 18070 }, { "epoch": 0.49, "learning_rate": 1.0695545116144066e-05, "loss": 1.4009, "step": 18071 }, { "epoch": 0.49, "learning_rate": 1.0694662748371589e-05, "loss": 1.229, "step": 18072 }, { "epoch": 0.49, "learning_rate": 1.06937803751644e-05, "loss": 1.2517, "step": 18073 }, { "epoch": 0.49, "learning_rate": 1.0692897996529396e-05, "loss": 1.298, "step": 18074 }, { "epoch": 0.49, "learning_rate": 1.0692015612473486e-05, "loss": 1.2925, "step": 18075 }, { "epoch": 0.49, "learning_rate": 1.0691133223003574e-05, "loss": 1.2808, "step": 18076 }, { "epoch": 0.49, "learning_rate": 1.0690250828126557e-05, "loss": 1.2327, "step": 18077 }, { "epoch": 0.49, "learning_rate": 1.0689368427849342e-05, "loss": 1.3337, "step": 18078 }, { "epoch": 0.49, "learning_rate": 1.0688486022178832e-05, "loss": 1.2307, "step": 18079 }, { "epoch": 0.49, "learning_rate": 1.0687603611121934e-05, "loss": 1.3665, "step": 18080 }, { "epoch": 0.49, "learning_rate": 1.0686721194685547e-05, "loss": 1.405, "step": 18081 }, { "epoch": 0.49, "learning_rate": 1.0685838772876577e-05, "loss": 1.3879, "step": 18082 }, { "epoch": 0.49, "learning_rate": 1.0684956345701927e-05, "loss": 1.3911, "step": 18083 }, { "epoch": 0.49, "learning_rate": 1.0684073913168502e-05, "loss": 1.3091, "step": 18084 }, { "epoch": 0.49, "learning_rate": 1.06831914752832e-05, "loss": 1.1846, "step": 18085 }, { "epoch": 0.49, "learning_rate": 1.0682309032052935e-05, "loss": 1.3198, "step": 18086 }, { "epoch": 0.49, "learning_rate": 1.06814265834846e-05, "loss": 1.1123, "step": 18087 }, { "epoch": 0.49, "learning_rate": 1.0680544129585107e-05, "loss": 1.6179, "step": 18088 }, { "epoch": 0.49, "learning_rate": 1.0679661670361355e-05, "loss": 1.3411, "step": 18089 }, { "epoch": 0.49, "learning_rate": 1.067877920582025e-05, "loss": 1.2632, "step": 18090 }, { "epoch": 0.49, "learning_rate": 1.0677896735968694e-05, "loss": 1.2478, "step": 18091 }, { "epoch": 0.49, "learning_rate": 1.0677014260813596e-05, "loss": 1.3667, "step": 18092 }, { "epoch": 0.49, "learning_rate": 1.0676131780361853e-05, "loss": 1.4089, "step": 18093 }, { "epoch": 0.49, "learning_rate": 1.0675249294620378e-05, "loss": 1.2463, "step": 18094 }, { "epoch": 0.49, "learning_rate": 1.0674366803596065e-05, "loss": 1.249, "step": 18095 }, { "epoch": 0.49, "learning_rate": 1.0673484307295827e-05, "loss": 1.2256, "step": 18096 }, { "epoch": 0.49, "learning_rate": 1.0672601805726562e-05, "loss": 1.3706, "step": 18097 }, { "epoch": 0.49, "learning_rate": 1.0671719298895178e-05, "loss": 1.231, "step": 18098 }, { "epoch": 0.49, "learning_rate": 1.0670836786808576e-05, "loss": 1.2556, "step": 18099 }, { "epoch": 0.49, "learning_rate": 1.0669954269473666e-05, "loss": 1.3872, "step": 18100 }, { "epoch": 0.49, "learning_rate": 1.0669071746897346e-05, "loss": 1.2163, "step": 18101 }, { "epoch": 0.49, "learning_rate": 1.0668189219086526e-05, "loss": 1.1309, "step": 18102 }, { "epoch": 0.49, "learning_rate": 1.0667306686048105e-05, "loss": 1.1863, "step": 18103 }, { "epoch": 0.49, "learning_rate": 1.0666424147788991e-05, "loss": 1.3394, "step": 18104 }, { "epoch": 0.49, "learning_rate": 1.0665541604316087e-05, "loss": 1.2207, "step": 18105 }, { "epoch": 0.49, "learning_rate": 1.06646590556363e-05, "loss": 1.1738, "step": 18106 }, { "epoch": 0.49, "learning_rate": 1.0663776501756531e-05, "loss": 1.1875, "step": 18107 }, { "epoch": 0.49, "learning_rate": 1.066289394268369e-05, "loss": 1.3704, "step": 18108 }, { "epoch": 0.49, "learning_rate": 1.0662011378424677e-05, "loss": 1.2251, "step": 18109 }, { "epoch": 0.49, "learning_rate": 1.06611288089864e-05, "loss": 1.3748, "step": 18110 }, { "epoch": 0.49, "learning_rate": 1.0660246234375757e-05, "loss": 1.2424, "step": 18111 }, { "epoch": 0.49, "learning_rate": 1.0659363654599664e-05, "loss": 1.4624, "step": 18112 }, { "epoch": 0.49, "learning_rate": 1.0658481069665017e-05, "loss": 1.4104, "step": 18113 }, { "epoch": 0.49, "learning_rate": 1.0657598479578724e-05, "loss": 1.3496, "step": 18114 }, { "epoch": 0.49, "learning_rate": 1.0656715884347688e-05, "loss": 1.5454, "step": 18115 }, { "epoch": 0.49, "learning_rate": 1.0655833283978818e-05, "loss": 1.2446, "step": 18116 }, { "epoch": 0.49, "learning_rate": 1.0654950678479015e-05, "loss": 1.3694, "step": 18117 }, { "epoch": 0.49, "learning_rate": 1.0654068067855187e-05, "loss": 1.3799, "step": 18118 }, { "epoch": 0.49, "learning_rate": 1.065318545211424e-05, "loss": 1.2559, "step": 18119 }, { "epoch": 0.49, "learning_rate": 1.0652302831263074e-05, "loss": 1.2434, "step": 18120 }, { "epoch": 0.49, "learning_rate": 1.0651420205308598e-05, "loss": 1.4539, "step": 18121 }, { "epoch": 0.49, "learning_rate": 1.0650537574257718e-05, "loss": 1.2935, "step": 18122 }, { "epoch": 0.49, "learning_rate": 1.0649654938117337e-05, "loss": 1.1584, "step": 18123 }, { "epoch": 0.49, "learning_rate": 1.064877229689436e-05, "loss": 1.3477, "step": 18124 }, { "epoch": 0.49, "learning_rate": 1.0647889650595695e-05, "loss": 1.2659, "step": 18125 }, { "epoch": 0.5, "learning_rate": 1.0647006999228247e-05, "loss": 1.2317, "step": 18126 }, { "epoch": 0.5, "learning_rate": 1.064612434279892e-05, "loss": 1.2065, "step": 18127 }, { "epoch": 0.5, "learning_rate": 1.0645241681314617e-05, "loss": 1.322, "step": 18128 }, { "epoch": 0.5, "learning_rate": 1.064435901478225e-05, "loss": 1.3489, "step": 18129 }, { "epoch": 0.5, "learning_rate": 1.0643476343208721e-05, "loss": 1.3563, "step": 18130 }, { "epoch": 0.5, "learning_rate": 1.0642593666600936e-05, "loss": 1.2834, "step": 18131 }, { "epoch": 0.5, "learning_rate": 1.0641710984965796e-05, "loss": 1.2793, "step": 18132 }, { "epoch": 0.5, "learning_rate": 1.0640828298310218e-05, "loss": 1.3499, "step": 18133 }, { "epoch": 0.5, "learning_rate": 1.0639945606641093e-05, "loss": 1.4248, "step": 18134 }, { "epoch": 0.5, "learning_rate": 1.0639062909965341e-05, "loss": 1.3376, "step": 18135 }, { "epoch": 0.5, "learning_rate": 1.0638180208289857e-05, "loss": 1.3911, "step": 18136 }, { "epoch": 0.5, "learning_rate": 1.063729750162155e-05, "loss": 1.1721, "step": 18137 }, { "epoch": 0.5, "learning_rate": 1.0636414789967332e-05, "loss": 1.2954, "step": 18138 }, { "epoch": 0.5, "learning_rate": 1.0635532073334101e-05, "loss": 1.2795, "step": 18139 }, { "epoch": 0.5, "learning_rate": 1.0634649351728765e-05, "loss": 1.291, "step": 18140 }, { "epoch": 0.5, "learning_rate": 1.0633766625158235e-05, "loss": 1.28, "step": 18141 }, { "epoch": 0.5, "learning_rate": 1.0632883893629408e-05, "loss": 1.4316, "step": 18142 }, { "epoch": 0.5, "learning_rate": 1.0632001157149198e-05, "loss": 1.3499, "step": 18143 }, { "epoch": 0.5, "learning_rate": 1.0631118415724509e-05, "loss": 1.231, "step": 18144 }, { "epoch": 0.5, "learning_rate": 1.0630235669362245e-05, "loss": 1.2451, "step": 18145 }, { "epoch": 0.5, "learning_rate": 1.0629352918069312e-05, "loss": 1.3755, "step": 18146 }, { "epoch": 0.5, "learning_rate": 1.062847016185262e-05, "loss": 1.1985, "step": 18147 }, { "epoch": 0.5, "learning_rate": 1.062758740071907e-05, "loss": 1.345, "step": 18148 }, { "epoch": 0.5, "learning_rate": 1.0626704634675576e-05, "loss": 1.3372, "step": 18149 }, { "epoch": 0.5, "learning_rate": 1.0625821863729036e-05, "loss": 1.3413, "step": 18150 }, { "epoch": 0.5, "learning_rate": 1.062493908788636e-05, "loss": 1.2505, "step": 18151 }, { "epoch": 0.5, "learning_rate": 1.0624056307154455e-05, "loss": 1.3826, "step": 18152 }, { "epoch": 0.5, "learning_rate": 1.0623173521540227e-05, "loss": 1.4033, "step": 18153 }, { "epoch": 0.5, "learning_rate": 1.0622290731050582e-05, "loss": 1.2781, "step": 18154 }, { "epoch": 0.5, "learning_rate": 1.062140793569243e-05, "loss": 1.335, "step": 18155 }, { "epoch": 0.5, "learning_rate": 1.062052513547267e-05, "loss": 1.3701, "step": 18156 }, { "epoch": 0.5, "learning_rate": 1.0619642330398217e-05, "loss": 1.3723, "step": 18157 }, { "epoch": 0.5, "learning_rate": 1.061875952047597e-05, "loss": 1.345, "step": 18158 }, { "epoch": 0.5, "learning_rate": 1.0617876705712844e-05, "loss": 1.3459, "step": 18159 }, { "epoch": 0.5, "learning_rate": 1.0616993886115736e-05, "loss": 1.2662, "step": 18160 }, { "epoch": 0.5, "learning_rate": 1.0616111061691563e-05, "loss": 1.2979, "step": 18161 }, { "epoch": 0.5, "learning_rate": 1.0615228232447223e-05, "loss": 1.2483, "step": 18162 }, { "epoch": 0.5, "learning_rate": 1.061434539838963e-05, "loss": 1.4163, "step": 18163 }, { "epoch": 0.5, "learning_rate": 1.0613462559525684e-05, "loss": 1.3586, "step": 18164 }, { "epoch": 0.5, "learning_rate": 1.0612579715862299e-05, "loss": 1.2178, "step": 18165 }, { "epoch": 0.5, "learning_rate": 1.0611696867406374e-05, "loss": 1.3538, "step": 18166 }, { "epoch": 0.5, "learning_rate": 1.0610814014164825e-05, "loss": 1.2222, "step": 18167 }, { "epoch": 0.5, "learning_rate": 1.060993115614455e-05, "loss": 1.3481, "step": 18168 }, { "epoch": 0.5, "learning_rate": 1.0609048293352462e-05, "loss": 1.2305, "step": 18169 }, { "epoch": 0.5, "learning_rate": 1.0608165425795469e-05, "loss": 1.4722, "step": 18170 }, { "epoch": 0.5, "learning_rate": 1.060728255348047e-05, "loss": 1.356, "step": 18171 }, { "epoch": 0.5, "learning_rate": 1.0606399676414385e-05, "loss": 1.3967, "step": 18172 }, { "epoch": 0.5, "learning_rate": 1.0605516794604109e-05, "loss": 1.2617, "step": 18173 }, { "epoch": 0.5, "learning_rate": 1.0604633908056559e-05, "loss": 1.2502, "step": 18174 }, { "epoch": 0.5, "learning_rate": 1.0603751016778631e-05, "loss": 1.238, "step": 18175 }, { "epoch": 0.5, "learning_rate": 1.0602868120777246e-05, "loss": 1.3428, "step": 18176 }, { "epoch": 0.5, "learning_rate": 1.0601985220059299e-05, "loss": 1.6982, "step": 18177 }, { "epoch": 0.5, "learning_rate": 1.0601102314631706e-05, "loss": 1.1765, "step": 18178 }, { "epoch": 0.5, "learning_rate": 1.060021940450137e-05, "loss": 1.1492, "step": 18179 }, { "epoch": 0.5, "learning_rate": 1.0599336489675199e-05, "loss": 1.2747, "step": 18180 }, { "epoch": 0.5, "learning_rate": 1.0598453570160101e-05, "loss": 1.4341, "step": 18181 }, { "epoch": 0.5, "learning_rate": 1.0597570645962982e-05, "loss": 1.366, "step": 18182 }, { "epoch": 0.5, "learning_rate": 1.0596687717090755e-05, "loss": 1.8447, "step": 18183 }, { "epoch": 0.5, "learning_rate": 1.059580478355032e-05, "loss": 1.3259, "step": 18184 }, { "epoch": 0.5, "learning_rate": 1.0594921845348592e-05, "loss": 1.3301, "step": 18185 }, { "epoch": 0.5, "learning_rate": 1.0594038902492475e-05, "loss": 1.3752, "step": 18186 }, { "epoch": 0.5, "learning_rate": 1.0593155954988874e-05, "loss": 1.3674, "step": 18187 }, { "epoch": 0.5, "learning_rate": 1.0592273002844704e-05, "loss": 1.3628, "step": 18188 }, { "epoch": 0.5, "learning_rate": 1.0591390046066865e-05, "loss": 1.3076, "step": 18189 }, { "epoch": 0.5, "learning_rate": 1.0590507084662272e-05, "loss": 1.3496, "step": 18190 }, { "epoch": 0.5, "learning_rate": 1.0589624118637825e-05, "loss": 1.2039, "step": 18191 }, { "epoch": 0.5, "learning_rate": 1.0588741148000438e-05, "loss": 1.1592, "step": 18192 }, { "epoch": 0.5, "learning_rate": 1.0587858172757017e-05, "loss": 1.3828, "step": 18193 }, { "epoch": 0.5, "learning_rate": 1.0586975192914473e-05, "loss": 1.3394, "step": 18194 }, { "epoch": 0.5, "learning_rate": 1.0586092208479706e-05, "loss": 1.043, "step": 18195 }, { "epoch": 0.5, "learning_rate": 1.0585209219459633e-05, "loss": 1.3638, "step": 18196 }, { "epoch": 0.5, "learning_rate": 1.0584326225861157e-05, "loss": 1.2666, "step": 18197 }, { "epoch": 0.5, "learning_rate": 1.0583443227691188e-05, "loss": 1.2529, "step": 18198 }, { "epoch": 0.5, "learning_rate": 1.0582560224956628e-05, "loss": 1.2393, "step": 18199 }, { "epoch": 0.5, "learning_rate": 1.0581677217664397e-05, "loss": 1.3579, "step": 18200 }, { "epoch": 0.5, "learning_rate": 1.0580794205821397e-05, "loss": 1.2566, "step": 18201 }, { "epoch": 0.5, "learning_rate": 1.0579911189434535e-05, "loss": 1.168, "step": 18202 }, { "epoch": 0.5, "learning_rate": 1.0579028168510718e-05, "loss": 1.2959, "step": 18203 }, { "epoch": 0.5, "learning_rate": 1.0578145143056861e-05, "loss": 1.2896, "step": 18204 }, { "epoch": 0.5, "learning_rate": 1.0577262113079865e-05, "loss": 1.2031, "step": 18205 }, { "epoch": 0.5, "learning_rate": 1.0576379078586645e-05, "loss": 1.3616, "step": 18206 }, { "epoch": 0.5, "learning_rate": 1.0575496039584104e-05, "loss": 1.3984, "step": 18207 }, { "epoch": 0.5, "learning_rate": 1.0574612996079151e-05, "loss": 1.1936, "step": 18208 }, { "epoch": 0.5, "learning_rate": 1.0573729948078699e-05, "loss": 1.3652, "step": 18209 }, { "epoch": 0.5, "learning_rate": 1.0572846895589652e-05, "loss": 1.3176, "step": 18210 }, { "epoch": 0.5, "learning_rate": 1.0571963838618922e-05, "loss": 1.248, "step": 18211 }, { "epoch": 0.5, "learning_rate": 1.0571080777173415e-05, "loss": 1.4126, "step": 18212 }, { "epoch": 0.5, "learning_rate": 1.057019771126004e-05, "loss": 1.416, "step": 18213 }, { "epoch": 0.5, "learning_rate": 1.0569314640885706e-05, "loss": 1.3079, "step": 18214 }, { "epoch": 0.5, "learning_rate": 1.056843156605732e-05, "loss": 1.853, "step": 18215 }, { "epoch": 0.5, "learning_rate": 1.0567548486781796e-05, "loss": 1.1775, "step": 18216 }, { "epoch": 0.5, "learning_rate": 1.0566665403066038e-05, "loss": 1.1956, "step": 18217 }, { "epoch": 0.5, "learning_rate": 1.0565782314916959e-05, "loss": 1.3494, "step": 18218 }, { "epoch": 0.5, "learning_rate": 1.0564899222341463e-05, "loss": 1.2227, "step": 18219 }, { "epoch": 0.5, "learning_rate": 1.0564016125346461e-05, "loss": 1.3809, "step": 18220 }, { "epoch": 0.5, "learning_rate": 1.0563133023938863e-05, "loss": 1.3574, "step": 18221 }, { "epoch": 0.5, "learning_rate": 1.0562249918125575e-05, "loss": 1.3301, "step": 18222 }, { "epoch": 0.5, "learning_rate": 1.0561366807913509e-05, "loss": 1.293, "step": 18223 }, { "epoch": 0.5, "learning_rate": 1.0560483693309576e-05, "loss": 1.1323, "step": 18224 }, { "epoch": 0.5, "learning_rate": 1.055960057432068e-05, "loss": 1.3005, "step": 18225 }, { "epoch": 0.5, "learning_rate": 1.0558717450953733e-05, "loss": 1.2197, "step": 18226 }, { "epoch": 0.5, "learning_rate": 1.055783432321564e-05, "loss": 1.2703, "step": 18227 }, { "epoch": 0.5, "learning_rate": 1.0556951191113316e-05, "loss": 1.3499, "step": 18228 }, { "epoch": 0.5, "learning_rate": 1.0556068054653667e-05, "loss": 1.0896, "step": 18229 }, { "epoch": 0.5, "learning_rate": 1.0555184913843604e-05, "loss": 1.2634, "step": 18230 }, { "epoch": 0.5, "learning_rate": 1.0554301768690036e-05, "loss": 1.1838, "step": 18231 }, { "epoch": 0.5, "learning_rate": 1.0553418619199869e-05, "loss": 1.2422, "step": 18232 }, { "epoch": 0.5, "learning_rate": 1.0552535465380018e-05, "loss": 1.332, "step": 18233 }, { "epoch": 0.5, "learning_rate": 1.0551652307237388e-05, "loss": 1.2876, "step": 18234 }, { "epoch": 0.5, "learning_rate": 1.0550769144778889e-05, "loss": 1.2588, "step": 18235 }, { "epoch": 0.5, "learning_rate": 1.0549885978011432e-05, "loss": 1.4365, "step": 18236 }, { "epoch": 0.5, "learning_rate": 1.0549002806941926e-05, "loss": 1.2961, "step": 18237 }, { "epoch": 0.5, "learning_rate": 1.0548119631577278e-05, "loss": 1.1738, "step": 18238 }, { "epoch": 0.5, "learning_rate": 1.0547236451924403e-05, "loss": 1.1528, "step": 18239 }, { "epoch": 0.5, "learning_rate": 1.0546353267990206e-05, "loss": 1.1638, "step": 18240 }, { "epoch": 0.5, "learning_rate": 1.0545470079781598e-05, "loss": 1.2664, "step": 18241 }, { "epoch": 0.5, "learning_rate": 1.0544586887305489e-05, "loss": 1.314, "step": 18242 }, { "epoch": 0.5, "learning_rate": 1.0543703690568788e-05, "loss": 1.3274, "step": 18243 }, { "epoch": 0.5, "learning_rate": 1.0542820489578404e-05, "loss": 1.304, "step": 18244 }, { "epoch": 0.5, "learning_rate": 1.054193728434125e-05, "loss": 1.2771, "step": 18245 }, { "epoch": 0.5, "learning_rate": 1.0541054074864228e-05, "loss": 1.344, "step": 18246 }, { "epoch": 0.5, "learning_rate": 1.0540170861154258e-05, "loss": 1.3401, "step": 18247 }, { "epoch": 0.5, "learning_rate": 1.0539287643218243e-05, "loss": 1.2123, "step": 18248 }, { "epoch": 0.5, "learning_rate": 1.05384044210631e-05, "loss": 1.2236, "step": 18249 }, { "epoch": 0.5, "learning_rate": 1.0537521194695728e-05, "loss": 1.365, "step": 18250 }, { "epoch": 0.5, "learning_rate": 1.0536637964123046e-05, "loss": 1.1741, "step": 18251 }, { "epoch": 0.5, "learning_rate": 1.0535754729351959e-05, "loss": 1.3718, "step": 18252 }, { "epoch": 0.5, "learning_rate": 1.0534871490389383e-05, "loss": 1.3496, "step": 18253 }, { "epoch": 0.5, "learning_rate": 1.0533988247242219e-05, "loss": 1.6987, "step": 18254 }, { "epoch": 0.5, "learning_rate": 1.0533104999917387e-05, "loss": 1.271, "step": 18255 }, { "epoch": 0.5, "learning_rate": 1.0532221748421786e-05, "loss": 1.2261, "step": 18256 }, { "epoch": 0.5, "learning_rate": 1.053133849276234e-05, "loss": 1.3386, "step": 18257 }, { "epoch": 0.5, "learning_rate": 1.0530455232945945e-05, "loss": 1.4087, "step": 18258 }, { "epoch": 0.5, "learning_rate": 1.0529571968979522e-05, "loss": 1.2898, "step": 18259 }, { "epoch": 0.5, "learning_rate": 1.0528688700869974e-05, "loss": 1.3884, "step": 18260 }, { "epoch": 0.5, "learning_rate": 1.0527805428624214e-05, "loss": 1.4409, "step": 18261 }, { "epoch": 0.5, "learning_rate": 1.0526922152249152e-05, "loss": 1.3372, "step": 18262 }, { "epoch": 0.5, "learning_rate": 1.05260388717517e-05, "loss": 1.3501, "step": 18263 }, { "epoch": 0.5, "learning_rate": 1.0525155587138769e-05, "loss": 1.4509, "step": 18264 }, { "epoch": 0.5, "learning_rate": 1.0524272298417266e-05, "loss": 1.2375, "step": 18265 }, { "epoch": 0.5, "learning_rate": 1.0523389005594102e-05, "loss": 1.2014, "step": 18266 }, { "epoch": 0.5, "learning_rate": 1.0522505708676192e-05, "loss": 1.3411, "step": 18267 }, { "epoch": 0.5, "learning_rate": 1.052162240767044e-05, "loss": 1.3062, "step": 18268 }, { "epoch": 0.5, "learning_rate": 1.0520739102583761e-05, "loss": 1.1311, "step": 18269 }, { "epoch": 0.5, "learning_rate": 1.0519855793423064e-05, "loss": 1.2085, "step": 18270 }, { "epoch": 0.5, "learning_rate": 1.051897248019526e-05, "loss": 1.3789, "step": 18271 }, { "epoch": 0.5, "learning_rate": 1.0518089162907257e-05, "loss": 1.3704, "step": 18272 }, { "epoch": 0.5, "learning_rate": 1.0517205841565972e-05, "loss": 1.4028, "step": 18273 }, { "epoch": 0.5, "learning_rate": 1.0516322516178308e-05, "loss": 1.2847, "step": 18274 }, { "epoch": 0.5, "learning_rate": 1.0515439186751182e-05, "loss": 1.3501, "step": 18275 }, { "epoch": 0.5, "learning_rate": 1.0514555853291499e-05, "loss": 1.292, "step": 18276 }, { "epoch": 0.5, "learning_rate": 1.0513672515806174e-05, "loss": 1.2913, "step": 18277 }, { "epoch": 0.5, "learning_rate": 1.051278917430212e-05, "loss": 1.3328, "step": 18278 }, { "epoch": 0.5, "learning_rate": 1.0511905828786242e-05, "loss": 1.2441, "step": 18279 }, { "epoch": 0.5, "learning_rate": 1.0511022479265456e-05, "loss": 1.2788, "step": 18280 }, { "epoch": 0.5, "learning_rate": 1.0510139125746665e-05, "loss": 1.3455, "step": 18281 }, { "epoch": 0.5, "learning_rate": 1.0509255768236792e-05, "loss": 1.2617, "step": 18282 }, { "epoch": 0.5, "learning_rate": 1.0508372406742737e-05, "loss": 1.2302, "step": 18283 }, { "epoch": 0.5, "learning_rate": 1.0507489041271417e-05, "loss": 1.2717, "step": 18284 }, { "epoch": 0.5, "learning_rate": 1.050660567182974e-05, "loss": 1.2607, "step": 18285 }, { "epoch": 0.5, "learning_rate": 1.050572229842462e-05, "loss": 1.2847, "step": 18286 }, { "epoch": 0.5, "learning_rate": 1.0504838921062965e-05, "loss": 1.2793, "step": 18287 }, { "epoch": 0.5, "learning_rate": 1.050395553975169e-05, "loss": 1.2371, "step": 18288 }, { "epoch": 0.5, "learning_rate": 1.0503072154497703e-05, "loss": 1.3772, "step": 18289 }, { "epoch": 0.5, "learning_rate": 1.0502188765307915e-05, "loss": 1.3289, "step": 18290 }, { "epoch": 0.5, "learning_rate": 1.0501305372189236e-05, "loss": 1.1926, "step": 18291 }, { "epoch": 0.5, "learning_rate": 1.0500421975148582e-05, "loss": 1.6924, "step": 18292 }, { "epoch": 0.5, "learning_rate": 1.049953857419286e-05, "loss": 1.293, "step": 18293 }, { "epoch": 0.5, "learning_rate": 1.0498655169328986e-05, "loss": 1.2458, "step": 18294 }, { "epoch": 0.5, "learning_rate": 1.0497771760563869e-05, "loss": 1.3181, "step": 18295 }, { "epoch": 0.5, "learning_rate": 1.0496888347904417e-05, "loss": 1.1899, "step": 18296 }, { "epoch": 0.5, "learning_rate": 1.0496004931357545e-05, "loss": 1.2058, "step": 18297 }, { "epoch": 0.5, "learning_rate": 1.0495121510930167e-05, "loss": 1.261, "step": 18298 }, { "epoch": 0.5, "learning_rate": 1.0494238086629184e-05, "loss": 1.7085, "step": 18299 }, { "epoch": 0.5, "learning_rate": 1.049335465846152e-05, "loss": 1.3308, "step": 18300 }, { "epoch": 0.5, "learning_rate": 1.049247122643408e-05, "loss": 1.3755, "step": 18301 }, { "epoch": 0.5, "learning_rate": 1.0491587790553779e-05, "loss": 1.4004, "step": 18302 }, { "epoch": 0.5, "learning_rate": 1.0490704350827523e-05, "loss": 1.3987, "step": 18303 }, { "epoch": 0.5, "learning_rate": 1.048982090726223e-05, "loss": 1.3411, "step": 18304 }, { "epoch": 0.5, "learning_rate": 1.0488937459864804e-05, "loss": 1.3206, "step": 18305 }, { "epoch": 0.5, "learning_rate": 1.0488054008642165e-05, "loss": 1.3237, "step": 18306 }, { "epoch": 0.5, "learning_rate": 1.0487170553601218e-05, "loss": 1.2783, "step": 18307 }, { "epoch": 0.5, "learning_rate": 1.048628709474888e-05, "loss": 1.4026, "step": 18308 }, { "epoch": 0.5, "learning_rate": 1.0485403632092056e-05, "loss": 1.3928, "step": 18309 }, { "epoch": 0.5, "learning_rate": 1.0484520165637668e-05, "loss": 1.3435, "step": 18310 }, { "epoch": 0.5, "learning_rate": 1.0483636695392619e-05, "loss": 1.2551, "step": 18311 }, { "epoch": 0.5, "learning_rate": 1.0482753221363826e-05, "loss": 1.4224, "step": 18312 }, { "epoch": 0.5, "learning_rate": 1.0481869743558197e-05, "loss": 1.3752, "step": 18313 }, { "epoch": 0.5, "learning_rate": 1.0480986261982649e-05, "loss": 1.2969, "step": 18314 }, { "epoch": 0.5, "learning_rate": 1.0480102776644086e-05, "loss": 1.2529, "step": 18315 }, { "epoch": 0.5, "learning_rate": 1.0479219287549427e-05, "loss": 1.1846, "step": 18316 }, { "epoch": 0.5, "learning_rate": 1.0478335794705581e-05, "loss": 1.2534, "step": 18317 }, { "epoch": 0.5, "learning_rate": 1.0477452298119461e-05, "loss": 1.1758, "step": 18318 }, { "epoch": 0.5, "learning_rate": 1.047656879779798e-05, "loss": 1.1259, "step": 18319 }, { "epoch": 0.5, "learning_rate": 1.0475685293748047e-05, "loss": 1.4426, "step": 18320 }, { "epoch": 0.5, "learning_rate": 1.0474801785976576e-05, "loss": 1.283, "step": 18321 }, { "epoch": 0.5, "learning_rate": 1.0473918274490482e-05, "loss": 1.3438, "step": 18322 }, { "epoch": 0.5, "learning_rate": 1.0473034759296669e-05, "loss": 1.301, "step": 18323 }, { "epoch": 0.5, "learning_rate": 1.0472151240402057e-05, "loss": 1.134, "step": 18324 }, { "epoch": 0.5, "learning_rate": 1.0471267717813559e-05, "loss": 1.228, "step": 18325 }, { "epoch": 0.5, "learning_rate": 1.0470384191538078e-05, "loss": 0.9824, "step": 18326 }, { "epoch": 0.5, "learning_rate": 1.0469500661582536e-05, "loss": 1.2288, "step": 18327 }, { "epoch": 0.5, "learning_rate": 1.0468617127953842e-05, "loss": 1.3872, "step": 18328 }, { "epoch": 0.5, "learning_rate": 1.0467733590658907e-05, "loss": 1.1714, "step": 18329 }, { "epoch": 0.5, "learning_rate": 1.0466850049704645e-05, "loss": 1.2937, "step": 18330 }, { "epoch": 0.5, "learning_rate": 1.0465966505097964e-05, "loss": 1.3425, "step": 18331 }, { "epoch": 0.5, "learning_rate": 1.0465082956845785e-05, "loss": 1.3345, "step": 18332 }, { "epoch": 0.5, "learning_rate": 1.0464199404955013e-05, "loss": 1.3547, "step": 18333 }, { "epoch": 0.5, "learning_rate": 1.0463315849432564e-05, "loss": 1.1018, "step": 18334 }, { "epoch": 0.5, "learning_rate": 1.046243229028535e-05, "loss": 1.7759, "step": 18335 }, { "epoch": 0.5, "learning_rate": 1.0461548727520282e-05, "loss": 1.3052, "step": 18336 }, { "epoch": 0.5, "learning_rate": 1.0460665161144275e-05, "loss": 1.7183, "step": 18337 }, { "epoch": 0.5, "learning_rate": 1.045978159116424e-05, "loss": 1.2861, "step": 18338 }, { "epoch": 0.5, "learning_rate": 1.045889801758709e-05, "loss": 1.2195, "step": 18339 }, { "epoch": 0.5, "learning_rate": 1.0458014440419737e-05, "loss": 1.2437, "step": 18340 }, { "epoch": 0.5, "learning_rate": 1.0457130859669095e-05, "loss": 1.2654, "step": 18341 }, { "epoch": 0.5, "learning_rate": 1.0456247275342075e-05, "loss": 1.2639, "step": 18342 }, { "epoch": 0.5, "learning_rate": 1.0455363687445594e-05, "loss": 1.354, "step": 18343 }, { "epoch": 0.5, "learning_rate": 1.045448009598656e-05, "loss": 1.2004, "step": 18344 }, { "epoch": 0.5, "learning_rate": 1.0453596500971887e-05, "loss": 1.1843, "step": 18345 }, { "epoch": 0.5, "learning_rate": 1.0452712902408489e-05, "loss": 1.3594, "step": 18346 }, { "epoch": 0.5, "learning_rate": 1.0451829300303278e-05, "loss": 1.3101, "step": 18347 }, { "epoch": 0.5, "learning_rate": 1.0450945694663167e-05, "loss": 1.2153, "step": 18348 }, { "epoch": 0.5, "learning_rate": 1.0450062085495067e-05, "loss": 1.3184, "step": 18349 }, { "epoch": 0.5, "learning_rate": 1.0449178472805895e-05, "loss": 1.1091, "step": 18350 }, { "epoch": 0.5, "learning_rate": 1.0448294856602561e-05, "loss": 1.1638, "step": 18351 }, { "epoch": 0.5, "learning_rate": 1.0447411236891977e-05, "loss": 1.3733, "step": 18352 }, { "epoch": 0.5, "learning_rate": 1.0446527613681064e-05, "loss": 1.2971, "step": 18353 }, { "epoch": 0.5, "learning_rate": 1.0445643986976722e-05, "loss": 1.3101, "step": 18354 }, { "epoch": 0.5, "learning_rate": 1.0444760356785874e-05, "loss": 1.3582, "step": 18355 }, { "epoch": 0.5, "learning_rate": 1.044387672311543e-05, "loss": 1.1919, "step": 18356 }, { "epoch": 0.5, "learning_rate": 1.0442993085972303e-05, "loss": 1.2639, "step": 18357 }, { "epoch": 0.5, "learning_rate": 1.0442109445363406e-05, "loss": 1.3643, "step": 18358 }, { "epoch": 0.5, "learning_rate": 1.0441225801295654e-05, "loss": 1.238, "step": 18359 }, { "epoch": 0.5, "learning_rate": 1.0440342153775957e-05, "loss": 0.998, "step": 18360 }, { "epoch": 0.5, "learning_rate": 1.0439458502811233e-05, "loss": 1.3062, "step": 18361 }, { "epoch": 0.5, "learning_rate": 1.0438574848408389e-05, "loss": 1.3667, "step": 18362 }, { "epoch": 0.5, "learning_rate": 1.0437691190574345e-05, "loss": 1.0803, "step": 18363 }, { "epoch": 0.5, "learning_rate": 1.0436807529316007e-05, "loss": 1.3047, "step": 18364 }, { "epoch": 0.5, "learning_rate": 1.0435923864640296e-05, "loss": 1.3296, "step": 18365 }, { "epoch": 0.5, "learning_rate": 1.0435040196554118e-05, "loss": 1.28, "step": 18366 }, { "epoch": 0.5, "learning_rate": 1.0434156525064395e-05, "loss": 1.1709, "step": 18367 }, { "epoch": 0.5, "learning_rate": 1.043327285017803e-05, "loss": 1.261, "step": 18368 }, { "epoch": 0.5, "learning_rate": 1.0432389171901947e-05, "loss": 1.4331, "step": 18369 }, { "epoch": 0.5, "learning_rate": 1.0431505490243048e-05, "loss": 1.3564, "step": 18370 }, { "epoch": 0.5, "learning_rate": 1.0430621805208258e-05, "loss": 1.1445, "step": 18371 }, { "epoch": 0.5, "learning_rate": 1.0429738116804481e-05, "loss": 1.2991, "step": 18372 }, { "epoch": 0.5, "learning_rate": 1.0428854425038641e-05, "loss": 1.2839, "step": 18373 }, { "epoch": 0.5, "learning_rate": 1.0427970729917642e-05, "loss": 1.3352, "step": 18374 }, { "epoch": 0.5, "learning_rate": 1.0427087031448404e-05, "loss": 1.334, "step": 18375 }, { "epoch": 0.5, "learning_rate": 1.0426203329637837e-05, "loss": 1.219, "step": 18376 }, { "epoch": 0.5, "learning_rate": 1.0425319624492854e-05, "loss": 1.2712, "step": 18377 }, { "epoch": 0.5, "learning_rate": 1.042443591602037e-05, "loss": 1.2219, "step": 18378 }, { "epoch": 0.5, "learning_rate": 1.04235522042273e-05, "loss": 1.2917, "step": 18379 }, { "epoch": 0.5, "learning_rate": 1.0422668489120558e-05, "loss": 1.105, "step": 18380 }, { "epoch": 0.5, "learning_rate": 1.0421784770707056e-05, "loss": 1.3165, "step": 18381 }, { "epoch": 0.5, "learning_rate": 1.0420901048993705e-05, "loss": 1.439, "step": 18382 }, { "epoch": 0.5, "learning_rate": 1.0420017323987426e-05, "loss": 1.2681, "step": 18383 }, { "epoch": 0.5, "learning_rate": 1.0419133595695128e-05, "loss": 1.3577, "step": 18384 }, { "epoch": 0.5, "learning_rate": 1.0418249864123724e-05, "loss": 1.272, "step": 18385 }, { "epoch": 0.5, "learning_rate": 1.0417366129280133e-05, "loss": 1.2991, "step": 18386 }, { "epoch": 0.5, "learning_rate": 1.041648239117126e-05, "loss": 1.4546, "step": 18387 }, { "epoch": 0.5, "learning_rate": 1.0415598649804031e-05, "loss": 1.2239, "step": 18388 }, { "epoch": 0.5, "learning_rate": 1.0414714905185351e-05, "loss": 1.3601, "step": 18389 }, { "epoch": 0.5, "learning_rate": 1.0413831157322138e-05, "loss": 1.3596, "step": 18390 }, { "epoch": 0.5, "learning_rate": 1.0412947406221301e-05, "loss": 1.395, "step": 18391 }, { "epoch": 0.5, "learning_rate": 1.0412063651889762e-05, "loss": 1.3054, "step": 18392 }, { "epoch": 0.5, "learning_rate": 1.0411179894334427e-05, "loss": 1.4792, "step": 18393 }, { "epoch": 0.5, "learning_rate": 1.0410296133562217e-05, "loss": 1.3081, "step": 18394 }, { "epoch": 0.5, "learning_rate": 1.0409412369580041e-05, "loss": 1.2837, "step": 18395 }, { "epoch": 0.5, "learning_rate": 1.0408528602394816e-05, "loss": 1.4426, "step": 18396 }, { "epoch": 0.5, "learning_rate": 1.0407644832013454e-05, "loss": 1.2937, "step": 18397 }, { "epoch": 0.5, "learning_rate": 1.0406761058442873e-05, "loss": 1.2773, "step": 18398 }, { "epoch": 0.5, "learning_rate": 1.0405877281689982e-05, "loss": 1.3313, "step": 18399 }, { "epoch": 0.5, "learning_rate": 1.04049935017617e-05, "loss": 1.2603, "step": 18400 }, { "epoch": 0.5, "learning_rate": 1.0404109718664937e-05, "loss": 1.3218, "step": 18401 }, { "epoch": 0.5, "learning_rate": 1.0403225932406612e-05, "loss": 1.1819, "step": 18402 }, { "epoch": 0.5, "learning_rate": 1.0402342142993636e-05, "loss": 1.3154, "step": 18403 }, { "epoch": 0.5, "learning_rate": 1.0401458350432925e-05, "loss": 1.3086, "step": 18404 }, { "epoch": 0.5, "learning_rate": 1.0400574554731392e-05, "loss": 1.3445, "step": 18405 }, { "epoch": 0.5, "learning_rate": 1.039969075589595e-05, "loss": 1.2075, "step": 18406 }, { "epoch": 0.5, "learning_rate": 1.0398806953933517e-05, "loss": 1.2915, "step": 18407 }, { "epoch": 0.5, "learning_rate": 1.0397923148851008e-05, "loss": 1.1372, "step": 18408 }, { "epoch": 0.5, "learning_rate": 1.0397039340655332e-05, "loss": 1.2114, "step": 18409 }, { "epoch": 0.5, "learning_rate": 1.039615552935341e-05, "loss": 1.3574, "step": 18410 }, { "epoch": 0.5, "learning_rate": 1.0395271714952151e-05, "loss": 1.4312, "step": 18411 }, { "epoch": 0.5, "learning_rate": 1.0394387897458475e-05, "loss": 1.3274, "step": 18412 }, { "epoch": 0.5, "learning_rate": 1.0393504076879291e-05, "loss": 1.4043, "step": 18413 }, { "epoch": 0.5, "learning_rate": 1.0392620253221517e-05, "loss": 1.2061, "step": 18414 }, { "epoch": 0.5, "learning_rate": 1.0391736426492067e-05, "loss": 1.3186, "step": 18415 }, { "epoch": 0.5, "learning_rate": 1.0390852596697853e-05, "loss": 1.2605, "step": 18416 }, { "epoch": 0.5, "learning_rate": 1.0389968763845792e-05, "loss": 1.3137, "step": 18417 }, { "epoch": 0.5, "learning_rate": 1.0389084927942803e-05, "loss": 1.3052, "step": 18418 }, { "epoch": 0.5, "learning_rate": 1.0388201088995793e-05, "loss": 1.3406, "step": 18419 }, { "epoch": 0.5, "learning_rate": 1.0387317247011683e-05, "loss": 1.3684, "step": 18420 }, { "epoch": 0.5, "learning_rate": 1.0386433401997383e-05, "loss": 1.1643, "step": 18421 }, { "epoch": 0.5, "learning_rate": 1.038554955395981e-05, "loss": 1.2627, "step": 18422 }, { "epoch": 0.5, "learning_rate": 1.0384665702905878e-05, "loss": 1.2231, "step": 18423 }, { "epoch": 0.5, "learning_rate": 1.0383781848842505e-05, "loss": 1.3997, "step": 18424 }, { "epoch": 0.5, "learning_rate": 1.0382897991776602e-05, "loss": 1.3313, "step": 18425 }, { "epoch": 0.5, "learning_rate": 1.0382014131715085e-05, "loss": 1.4492, "step": 18426 }, { "epoch": 0.5, "learning_rate": 1.0381130268664868e-05, "loss": 1.3496, "step": 18427 }, { "epoch": 0.5, "learning_rate": 1.038024640263287e-05, "loss": 1.4407, "step": 18428 }, { "epoch": 0.5, "learning_rate": 1.0379362533625998e-05, "loss": 1.2087, "step": 18429 }, { "epoch": 0.5, "learning_rate": 1.0378478661651176e-05, "loss": 1.0739, "step": 18430 }, { "epoch": 0.5, "learning_rate": 1.0377594786715313e-05, "loss": 1.2708, "step": 18431 }, { "epoch": 0.5, "learning_rate": 1.0376710908825325e-05, "loss": 1.1833, "step": 18432 }, { "epoch": 0.5, "learning_rate": 1.037582702798813e-05, "loss": 1.2844, "step": 18433 }, { "epoch": 0.5, "learning_rate": 1.0374943144210641e-05, "loss": 1.3657, "step": 18434 }, { "epoch": 0.5, "learning_rate": 1.0374059257499773e-05, "loss": 1.2266, "step": 18435 }, { "epoch": 0.5, "learning_rate": 1.037317536786244e-05, "loss": 1.3779, "step": 18436 }, { "epoch": 0.5, "learning_rate": 1.037229147530556e-05, "loss": 1.4131, "step": 18437 }, { "epoch": 0.5, "learning_rate": 1.0371407579836046e-05, "loss": 1.3225, "step": 18438 }, { "epoch": 0.5, "learning_rate": 1.0370523681460816e-05, "loss": 1.0803, "step": 18439 }, { "epoch": 0.5, "learning_rate": 1.0369639780186777e-05, "loss": 1.4429, "step": 18440 }, { "epoch": 0.5, "learning_rate": 1.0368755876020858e-05, "loss": 1.1685, "step": 18441 }, { "epoch": 0.5, "learning_rate": 1.036787196896996e-05, "loss": 1.4126, "step": 18442 }, { "epoch": 0.5, "learning_rate": 1.0366988059041008e-05, "loss": 1.3076, "step": 18443 }, { "epoch": 0.5, "learning_rate": 1.0366104146240912e-05, "loss": 1.3647, "step": 18444 }, { "epoch": 0.5, "learning_rate": 1.0365220230576592e-05, "loss": 1.2856, "step": 18445 }, { "epoch": 0.5, "learning_rate": 1.0364336312054956e-05, "loss": 1.0881, "step": 18446 }, { "epoch": 0.5, "learning_rate": 1.0363452390682927e-05, "loss": 1.1941, "step": 18447 }, { "epoch": 0.5, "learning_rate": 1.0362568466467418e-05, "loss": 1.2634, "step": 18448 }, { "epoch": 0.5, "learning_rate": 1.0361684539415342e-05, "loss": 1.3137, "step": 18449 }, { "epoch": 0.5, "learning_rate": 1.0360800609533617e-05, "loss": 1.2605, "step": 18450 }, { "epoch": 0.5, "learning_rate": 1.035991667682916e-05, "loss": 1.2881, "step": 18451 }, { "epoch": 0.5, "learning_rate": 1.0359032741308881e-05, "loss": 1.3906, "step": 18452 }, { "epoch": 0.5, "learning_rate": 1.0358148802979702e-05, "loss": 1.2141, "step": 18453 }, { "epoch": 0.5, "learning_rate": 1.035726486184853e-05, "loss": 1.3774, "step": 18454 }, { "epoch": 0.5, "learning_rate": 1.035638091792229e-05, "loss": 1.3059, "step": 18455 }, { "epoch": 0.5, "learning_rate": 1.0355496971207893e-05, "loss": 1.1895, "step": 18456 }, { "epoch": 0.5, "learning_rate": 1.0354613021712254e-05, "loss": 1.1873, "step": 18457 }, { "epoch": 0.5, "learning_rate": 1.0353729069442288e-05, "loss": 1.2529, "step": 18458 }, { "epoch": 0.5, "learning_rate": 1.0352845114404915e-05, "loss": 1.2034, "step": 18459 }, { "epoch": 0.5, "learning_rate": 1.0351961156607046e-05, "loss": 1.2463, "step": 18460 }, { "epoch": 0.5, "learning_rate": 1.0351077196055598e-05, "loss": 1.2371, "step": 18461 }, { "epoch": 0.5, "learning_rate": 1.0350193232757488e-05, "loss": 1.4673, "step": 18462 }, { "epoch": 0.5, "learning_rate": 1.0349309266719629e-05, "loss": 1.1326, "step": 18463 }, { "epoch": 0.5, "learning_rate": 1.034842529794894e-05, "loss": 1.1704, "step": 18464 }, { "epoch": 0.5, "learning_rate": 1.0347541326452337e-05, "loss": 1.1912, "step": 18465 }, { "epoch": 0.5, "learning_rate": 1.0346657352236731e-05, "loss": 1.3784, "step": 18466 }, { "epoch": 0.5, "learning_rate": 1.0345773375309045e-05, "loss": 1.4358, "step": 18467 }, { "epoch": 0.5, "learning_rate": 1.0344889395676186e-05, "loss": 1.3076, "step": 18468 }, { "epoch": 0.5, "learning_rate": 1.0344005413345077e-05, "loss": 1.3672, "step": 18469 }, { "epoch": 0.5, "learning_rate": 1.0343121428322632e-05, "loss": 1.3022, "step": 18470 }, { "epoch": 0.5, "learning_rate": 1.0342237440615765e-05, "loss": 1.4478, "step": 18471 }, { "epoch": 0.5, "learning_rate": 1.0341353450231393e-05, "loss": 1.2644, "step": 18472 }, { "epoch": 0.5, "learning_rate": 1.0340469457176434e-05, "loss": 1.3669, "step": 18473 }, { "epoch": 0.5, "learning_rate": 1.0339585461457799e-05, "loss": 1.2476, "step": 18474 }, { "epoch": 0.5, "learning_rate": 1.033870146308241e-05, "loss": 1.1858, "step": 18475 }, { "epoch": 0.5, "learning_rate": 1.0337817462057179e-05, "loss": 1.3513, "step": 18476 }, { "epoch": 0.5, "learning_rate": 1.0336933458389025e-05, "loss": 1.3047, "step": 18477 }, { "epoch": 0.5, "learning_rate": 1.0336049452084858e-05, "loss": 1.2612, "step": 18478 }, { "epoch": 0.5, "learning_rate": 1.0335165443151598e-05, "loss": 1.1655, "step": 18479 }, { "epoch": 0.5, "learning_rate": 1.0334281431596163e-05, "loss": 1.3677, "step": 18480 }, { "epoch": 0.5, "learning_rate": 1.0333397417425468e-05, "loss": 1.3428, "step": 18481 }, { "epoch": 0.5, "learning_rate": 1.0332513400646427e-05, "loss": 1.1268, "step": 18482 }, { "epoch": 0.5, "learning_rate": 1.0331629381265959e-05, "loss": 1.311, "step": 18483 }, { "epoch": 0.5, "learning_rate": 1.0330745359290979e-05, "loss": 1.323, "step": 18484 }, { "epoch": 0.5, "learning_rate": 1.0329861334728402e-05, "loss": 1.2224, "step": 18485 }, { "epoch": 0.5, "learning_rate": 1.0328977307585144e-05, "loss": 1.303, "step": 18486 }, { "epoch": 0.5, "learning_rate": 1.0328093277868126e-05, "loss": 1.2798, "step": 18487 }, { "epoch": 0.5, "learning_rate": 1.0327209245584255e-05, "loss": 1.3, "step": 18488 }, { "epoch": 0.5, "learning_rate": 1.0326325210740455e-05, "loss": 1.1711, "step": 18489 }, { "epoch": 0.5, "learning_rate": 1.032544117334364e-05, "loss": 1.21, "step": 18490 }, { "epoch": 0.5, "learning_rate": 1.0324557133400728e-05, "loss": 1.3088, "step": 18491 }, { "epoch": 0.51, "learning_rate": 1.0323673090918631e-05, "loss": 1.3875, "step": 18492 }, { "epoch": 0.51, "learning_rate": 1.0322789045904272e-05, "loss": 1.2559, "step": 18493 }, { "epoch": 0.51, "learning_rate": 1.0321904998364558e-05, "loss": 1.2222, "step": 18494 }, { "epoch": 0.51, "learning_rate": 1.0321020948306413e-05, "loss": 1.2095, "step": 18495 }, { "epoch": 0.51, "learning_rate": 1.0320136895736752e-05, "loss": 1.3396, "step": 18496 }, { "epoch": 0.51, "learning_rate": 1.0319252840662489e-05, "loss": 1.3633, "step": 18497 }, { "epoch": 0.51, "learning_rate": 1.0318368783090544e-05, "loss": 1.4133, "step": 18498 }, { "epoch": 0.51, "learning_rate": 1.0317484723027829e-05, "loss": 1.2517, "step": 18499 }, { "epoch": 0.51, "learning_rate": 1.0316600660481265e-05, "loss": 1.3291, "step": 18500 }, { "epoch": 0.51, "learning_rate": 1.0315716595457762e-05, "loss": 1.3149, "step": 18501 }, { "epoch": 0.51, "learning_rate": 1.0314832527964248e-05, "loss": 1.2354, "step": 18502 }, { "epoch": 0.51, "learning_rate": 1.0313948458007626e-05, "loss": 1.332, "step": 18503 }, { "epoch": 0.51, "learning_rate": 1.0313064385594822e-05, "loss": 1.2307, "step": 18504 }, { "epoch": 0.51, "learning_rate": 1.0312180310732747e-05, "loss": 1.3455, "step": 18505 }, { "epoch": 0.51, "learning_rate": 1.0311296233428323e-05, "loss": 1.3076, "step": 18506 }, { "epoch": 0.51, "learning_rate": 1.031041215368846e-05, "loss": 1.3064, "step": 18507 }, { "epoch": 0.51, "learning_rate": 1.0309528071520082e-05, "loss": 1.2634, "step": 18508 }, { "epoch": 0.51, "learning_rate": 1.03086439869301e-05, "loss": 1.2729, "step": 18509 }, { "epoch": 0.51, "learning_rate": 1.0307759899925433e-05, "loss": 1.4482, "step": 18510 }, { "epoch": 0.51, "learning_rate": 1.0306875810512996e-05, "loss": 1.4375, "step": 18511 }, { "epoch": 0.51, "learning_rate": 1.0305991718699708e-05, "loss": 1.0681, "step": 18512 }, { "epoch": 0.51, "learning_rate": 1.0305107624492486e-05, "loss": 1.3479, "step": 18513 }, { "epoch": 0.51, "learning_rate": 1.0304223527898244e-05, "loss": 1.3076, "step": 18514 }, { "epoch": 0.51, "learning_rate": 1.03033394289239e-05, "loss": 1.2029, "step": 18515 }, { "epoch": 0.51, "learning_rate": 1.0302455327576372e-05, "loss": 1.2319, "step": 18516 }, { "epoch": 0.51, "learning_rate": 1.0301571223862574e-05, "loss": 1.3472, "step": 18517 }, { "epoch": 0.51, "learning_rate": 1.0300687117789427e-05, "loss": 1.1951, "step": 18518 }, { "epoch": 0.51, "learning_rate": 1.0299803009363845e-05, "loss": 1.2253, "step": 18519 }, { "epoch": 0.51, "learning_rate": 1.0298918898592744e-05, "loss": 1.2966, "step": 18520 }, { "epoch": 0.51, "learning_rate": 1.0298034785483042e-05, "loss": 1.2097, "step": 18521 }, { "epoch": 0.51, "learning_rate": 1.0297150670041657e-05, "loss": 1.3042, "step": 18522 }, { "epoch": 0.51, "learning_rate": 1.0296266552275504e-05, "loss": 1.3938, "step": 18523 }, { "epoch": 0.51, "learning_rate": 1.0295382432191503e-05, "loss": 1.676, "step": 18524 }, { "epoch": 0.51, "learning_rate": 1.0294498309796563e-05, "loss": 1.2126, "step": 18525 }, { "epoch": 0.51, "learning_rate": 1.0293614185097611e-05, "loss": 1.2036, "step": 18526 }, { "epoch": 0.51, "learning_rate": 1.0292730058101559e-05, "loss": 1.3638, "step": 18527 }, { "epoch": 0.51, "learning_rate": 1.0291845928815327e-05, "loss": 1.3103, "step": 18528 }, { "epoch": 0.51, "learning_rate": 1.0290961797245826e-05, "loss": 1.2354, "step": 18529 }, { "epoch": 0.51, "learning_rate": 1.029007766339998e-05, "loss": 1.189, "step": 18530 }, { "epoch": 0.51, "learning_rate": 1.02891935272847e-05, "loss": 1.2493, "step": 18531 }, { "epoch": 0.51, "learning_rate": 1.0288309388906908e-05, "loss": 1.3806, "step": 18532 }, { "epoch": 0.51, "learning_rate": 1.0287425248273516e-05, "loss": 1.1858, "step": 18533 }, { "epoch": 0.51, "learning_rate": 1.0286541105391447e-05, "loss": 1.3562, "step": 18534 }, { "epoch": 0.51, "learning_rate": 1.0285656960267613e-05, "loss": 1.3982, "step": 18535 }, { "epoch": 0.51, "learning_rate": 1.0284772812908936e-05, "loss": 1.2554, "step": 18536 }, { "epoch": 0.51, "learning_rate": 1.0283888663322328e-05, "loss": 1.3567, "step": 18537 }, { "epoch": 0.51, "learning_rate": 1.0283004511514712e-05, "loss": 1.2656, "step": 18538 }, { "epoch": 0.51, "learning_rate": 1.0282120357492997e-05, "loss": 1.158, "step": 18539 }, { "epoch": 0.51, "learning_rate": 1.028123620126411e-05, "loss": 1.1304, "step": 18540 }, { "epoch": 0.51, "learning_rate": 1.0280352042834959e-05, "loss": 1.2297, "step": 18541 }, { "epoch": 0.51, "learning_rate": 1.0279467882212464e-05, "loss": 1.3445, "step": 18542 }, { "epoch": 0.51, "learning_rate": 1.0278583719403548e-05, "loss": 1.2188, "step": 18543 }, { "epoch": 0.51, "learning_rate": 1.0277699554415121e-05, "loss": 1.3005, "step": 18544 }, { "epoch": 0.51, "learning_rate": 1.0276815387254106e-05, "loss": 1.4092, "step": 18545 }, { "epoch": 0.51, "learning_rate": 1.0275931217927416e-05, "loss": 1.186, "step": 18546 }, { "epoch": 0.51, "learning_rate": 1.027504704644197e-05, "loss": 1.3638, "step": 18547 }, { "epoch": 0.51, "learning_rate": 1.0274162872804685e-05, "loss": 1.2151, "step": 18548 }, { "epoch": 0.51, "learning_rate": 1.0273278697022479e-05, "loss": 1.5063, "step": 18549 }, { "epoch": 0.51, "learning_rate": 1.0272394519102268e-05, "loss": 1.2539, "step": 18550 }, { "epoch": 0.51, "learning_rate": 1.0271510339050974e-05, "loss": 1.3418, "step": 18551 }, { "epoch": 0.51, "learning_rate": 1.0270626156875507e-05, "loss": 1.282, "step": 18552 }, { "epoch": 0.51, "learning_rate": 1.026974197258279e-05, "loss": 1.1023, "step": 18553 }, { "epoch": 0.51, "learning_rate": 1.0268857786179737e-05, "loss": 1.5176, "step": 18554 }, { "epoch": 0.51, "learning_rate": 1.0267973597673268e-05, "loss": 1.3088, "step": 18555 }, { "epoch": 0.51, "learning_rate": 1.02670894070703e-05, "loss": 1.3074, "step": 18556 }, { "epoch": 0.51, "learning_rate": 1.026620521437775e-05, "loss": 1.0569, "step": 18557 }, { "epoch": 0.51, "learning_rate": 1.0265321019602535e-05, "loss": 1.2415, "step": 18558 }, { "epoch": 0.51, "learning_rate": 1.0264436822751573e-05, "loss": 1.2827, "step": 18559 }, { "epoch": 0.51, "learning_rate": 1.0263552623831781e-05, "loss": 1.2988, "step": 18560 }, { "epoch": 0.51, "learning_rate": 1.0262668422850079e-05, "loss": 1.2378, "step": 18561 }, { "epoch": 0.51, "learning_rate": 1.0261784219813381e-05, "loss": 1.196, "step": 18562 }, { "epoch": 0.51, "learning_rate": 1.0260900014728609e-05, "loss": 1.2693, "step": 18563 }, { "epoch": 0.51, "learning_rate": 1.0260015807602675e-05, "loss": 1.1865, "step": 18564 }, { "epoch": 0.51, "learning_rate": 1.0259131598442502e-05, "loss": 1.2942, "step": 18565 }, { "epoch": 0.51, "learning_rate": 1.0258247387255005e-05, "loss": 1.3928, "step": 18566 }, { "epoch": 0.51, "learning_rate": 1.0257363174047102e-05, "loss": 1.26, "step": 18567 }, { "epoch": 0.51, "learning_rate": 1.0256478958825708e-05, "loss": 1.2446, "step": 18568 }, { "epoch": 0.51, "learning_rate": 1.0255594741597746e-05, "loss": 1.228, "step": 18569 }, { "epoch": 0.51, "learning_rate": 1.0254710522370129e-05, "loss": 1.1694, "step": 18570 }, { "epoch": 0.51, "learning_rate": 1.0253826301149779e-05, "loss": 1.2712, "step": 18571 }, { "epoch": 0.51, "learning_rate": 1.0252942077943605e-05, "loss": 1.1912, "step": 18572 }, { "epoch": 0.51, "learning_rate": 1.025205785275854e-05, "loss": 1.2588, "step": 18573 }, { "epoch": 0.51, "learning_rate": 1.0251173625601486e-05, "loss": 1.3293, "step": 18574 }, { "epoch": 0.51, "learning_rate": 1.025028939647937e-05, "loss": 1.0344, "step": 18575 }, { "epoch": 0.51, "learning_rate": 1.024940516539911e-05, "loss": 1.428, "step": 18576 }, { "epoch": 0.51, "learning_rate": 1.0248520932367619e-05, "loss": 1.3186, "step": 18577 }, { "epoch": 0.51, "learning_rate": 1.0247636697391816e-05, "loss": 1.0967, "step": 18578 }, { "epoch": 0.51, "learning_rate": 1.0246752460478623e-05, "loss": 1.2283, "step": 18579 }, { "epoch": 0.51, "learning_rate": 1.0245868221634951e-05, "loss": 1.2964, "step": 18580 }, { "epoch": 0.51, "learning_rate": 1.0244983980867727e-05, "loss": 1.3125, "step": 18581 }, { "epoch": 0.51, "learning_rate": 1.0244099738183857e-05, "loss": 1.3491, "step": 18582 }, { "epoch": 0.51, "learning_rate": 1.024321549359027e-05, "loss": 1.428, "step": 18583 }, { "epoch": 0.51, "learning_rate": 1.0242331247093878e-05, "loss": 1.2107, "step": 18584 }, { "epoch": 0.51, "learning_rate": 1.02414469987016e-05, "loss": 1.3119, "step": 18585 }, { "epoch": 0.51, "learning_rate": 1.0240562748420354e-05, "loss": 1.2434, "step": 18586 }, { "epoch": 0.51, "learning_rate": 1.0239678496257057e-05, "loss": 1.1838, "step": 18587 }, { "epoch": 0.51, "learning_rate": 1.0238794242218632e-05, "loss": 1.7773, "step": 18588 }, { "epoch": 0.51, "learning_rate": 1.0237909986311991e-05, "loss": 1.3689, "step": 18589 }, { "epoch": 0.51, "learning_rate": 1.0237025728544055e-05, "loss": 1.2876, "step": 18590 }, { "epoch": 0.51, "learning_rate": 1.0236141468921738e-05, "loss": 1.5066, "step": 18591 }, { "epoch": 0.51, "learning_rate": 1.0235257207451964e-05, "loss": 1.2952, "step": 18592 }, { "epoch": 0.51, "learning_rate": 1.023437294414165e-05, "loss": 1.3511, "step": 18593 }, { "epoch": 0.51, "learning_rate": 1.0233488678997708e-05, "loss": 1.3245, "step": 18594 }, { "epoch": 0.51, "learning_rate": 1.0232604412027063e-05, "loss": 1.3823, "step": 18595 }, { "epoch": 0.51, "learning_rate": 1.0231720143236628e-05, "loss": 1.2646, "step": 18596 }, { "epoch": 0.51, "learning_rate": 1.0230835872633327e-05, "loss": 1.3625, "step": 18597 }, { "epoch": 0.51, "learning_rate": 1.0229951600224073e-05, "loss": 1.5093, "step": 18598 }, { "epoch": 0.51, "learning_rate": 1.0229067326015786e-05, "loss": 1.3105, "step": 18599 }, { "epoch": 0.51, "learning_rate": 1.0228183050015383e-05, "loss": 1.2322, "step": 18600 }, { "epoch": 0.51, "learning_rate": 1.0227298772229786e-05, "loss": 1.2739, "step": 18601 }, { "epoch": 0.51, "learning_rate": 1.0226414492665906e-05, "loss": 1.3567, "step": 18602 }, { "epoch": 0.51, "learning_rate": 1.0225530211330667e-05, "loss": 1.3621, "step": 18603 }, { "epoch": 0.51, "learning_rate": 1.0224645928230988e-05, "loss": 1.1748, "step": 18604 }, { "epoch": 0.51, "learning_rate": 1.0223761643373782e-05, "loss": 1.269, "step": 18605 }, { "epoch": 0.51, "learning_rate": 1.0222877356765971e-05, "loss": 1.2549, "step": 18606 }, { "epoch": 0.51, "learning_rate": 1.0221993068414472e-05, "loss": 1.2671, "step": 18607 }, { "epoch": 0.51, "learning_rate": 1.0221108778326205e-05, "loss": 1.3604, "step": 18608 }, { "epoch": 0.51, "learning_rate": 1.0220224486508086e-05, "loss": 1.4021, "step": 18609 }, { "epoch": 0.51, "learning_rate": 1.0219340192967036e-05, "loss": 1.3809, "step": 18610 }, { "epoch": 0.51, "learning_rate": 1.0218455897709969e-05, "loss": 1.2437, "step": 18611 }, { "epoch": 0.51, "learning_rate": 1.0217571600743807e-05, "loss": 1.4773, "step": 18612 }, { "epoch": 0.51, "learning_rate": 1.0216687302075467e-05, "loss": 1.3669, "step": 18613 }, { "epoch": 0.51, "learning_rate": 1.0215803001711868e-05, "loss": 1.2036, "step": 18614 }, { "epoch": 0.51, "learning_rate": 1.0214918699659926e-05, "loss": 1.3042, "step": 18615 }, { "epoch": 0.51, "learning_rate": 1.0214034395926565e-05, "loss": 1.2375, "step": 18616 }, { "epoch": 0.51, "learning_rate": 1.0213150090518693e-05, "loss": 1.2354, "step": 18617 }, { "epoch": 0.51, "learning_rate": 1.0212265783443238e-05, "loss": 1.2581, "step": 18618 }, { "epoch": 0.51, "learning_rate": 1.0211381474707116e-05, "loss": 1.3906, "step": 18619 }, { "epoch": 0.51, "learning_rate": 1.0210497164317246e-05, "loss": 1.2207, "step": 18620 }, { "epoch": 0.51, "learning_rate": 1.020961285228054e-05, "loss": 1.1614, "step": 18621 }, { "epoch": 0.51, "learning_rate": 1.0208728538603929e-05, "loss": 1.4053, "step": 18622 }, { "epoch": 0.51, "learning_rate": 1.0207844223294318e-05, "loss": 1.2219, "step": 18623 }, { "epoch": 0.51, "learning_rate": 1.0206959906358635e-05, "loss": 1.2427, "step": 18624 }, { "epoch": 0.51, "learning_rate": 1.0206075587803795e-05, "loss": 1.2307, "step": 18625 }, { "epoch": 0.51, "learning_rate": 1.0205191267636716e-05, "loss": 1.3687, "step": 18626 }, { "epoch": 0.51, "learning_rate": 1.0204306945864316e-05, "loss": 1.292, "step": 18627 }, { "epoch": 0.51, "learning_rate": 1.0203422622493517e-05, "loss": 1.2671, "step": 18628 }, { "epoch": 0.51, "learning_rate": 1.0202538297531232e-05, "loss": 1.4309, "step": 18629 }, { "epoch": 0.51, "learning_rate": 1.0201653970984385e-05, "loss": 1.2471, "step": 18630 }, { "epoch": 0.51, "learning_rate": 1.020076964285989e-05, "loss": 1.2051, "step": 18631 }, { "epoch": 0.51, "learning_rate": 1.019988531316467e-05, "loss": 1.177, "step": 18632 }, { "epoch": 0.51, "learning_rate": 1.0199000981905638e-05, "loss": 1.0947, "step": 18633 }, { "epoch": 0.51, "learning_rate": 1.0198116649089718e-05, "loss": 1.2678, "step": 18634 }, { "epoch": 0.51, "learning_rate": 1.0197232314723823e-05, "loss": 1.4082, "step": 18635 }, { "epoch": 0.51, "learning_rate": 1.019634797881488e-05, "loss": 1.0981, "step": 18636 }, { "epoch": 0.51, "learning_rate": 1.01954636413698e-05, "loss": 1.2415, "step": 18637 }, { "epoch": 0.51, "learning_rate": 1.0194579302395509e-05, "loss": 1.3296, "step": 18638 }, { "epoch": 0.51, "learning_rate": 1.0193694961898916e-05, "loss": 1.189, "step": 18639 }, { "epoch": 0.51, "learning_rate": 1.0192810619886948e-05, "loss": 1.3416, "step": 18640 }, { "epoch": 0.51, "learning_rate": 1.0191926276366518e-05, "loss": 1.1775, "step": 18641 }, { "epoch": 0.51, "learning_rate": 1.0191041931344547e-05, "loss": 1.2539, "step": 18642 }, { "epoch": 0.51, "learning_rate": 1.0190157584827952e-05, "loss": 1.3586, "step": 18643 }, { "epoch": 0.51, "learning_rate": 1.018927323682366e-05, "loss": 1.2502, "step": 18644 }, { "epoch": 0.51, "learning_rate": 1.0188388887338579e-05, "loss": 1.3398, "step": 18645 }, { "epoch": 0.51, "learning_rate": 1.018750453637963e-05, "loss": 1.2299, "step": 18646 }, { "epoch": 0.51, "learning_rate": 1.0186620183953736e-05, "loss": 1.2375, "step": 18647 }, { "epoch": 0.51, "learning_rate": 1.0185735830067816e-05, "loss": 1.1216, "step": 18648 }, { "epoch": 0.51, "learning_rate": 1.018485147472878e-05, "loss": 1.4155, "step": 18649 }, { "epoch": 0.51, "learning_rate": 1.0183967117943557e-05, "loss": 1.2537, "step": 18650 }, { "epoch": 0.51, "learning_rate": 1.0183082759719063e-05, "loss": 1.3381, "step": 18651 }, { "epoch": 0.51, "learning_rate": 1.0182198400062213e-05, "loss": 1.2499, "step": 18652 }, { "epoch": 0.51, "learning_rate": 1.018131403897993e-05, "loss": 1.3701, "step": 18653 }, { "epoch": 0.51, "learning_rate": 1.0180429676479129e-05, "loss": 1.3345, "step": 18654 }, { "epoch": 0.51, "learning_rate": 1.0179545312566734e-05, "loss": 1.192, "step": 18655 }, { "epoch": 0.51, "learning_rate": 1.0178660947249659e-05, "loss": 1.386, "step": 18656 }, { "epoch": 0.51, "learning_rate": 1.0177776580534825e-05, "loss": 1.1785, "step": 18657 }, { "epoch": 0.51, "learning_rate": 1.017689221242915e-05, "loss": 1.3904, "step": 18658 }, { "epoch": 0.51, "learning_rate": 1.0176007842939555e-05, "loss": 1.0974, "step": 18659 }, { "epoch": 0.51, "learning_rate": 1.0175123472072956e-05, "loss": 1.7256, "step": 18660 }, { "epoch": 0.51, "learning_rate": 1.0174239099836277e-05, "loss": 1.2976, "step": 18661 }, { "epoch": 0.51, "learning_rate": 1.0173354726236429e-05, "loss": 1.2185, "step": 18662 }, { "epoch": 0.51, "learning_rate": 1.0172470351280338e-05, "loss": 1.2913, "step": 18663 }, { "epoch": 0.51, "learning_rate": 1.0171585974974916e-05, "loss": 1.3108, "step": 18664 }, { "epoch": 0.51, "learning_rate": 1.0170701597327086e-05, "loss": 1.1907, "step": 18665 }, { "epoch": 0.51, "learning_rate": 1.016981721834377e-05, "loss": 1.2864, "step": 18666 }, { "epoch": 0.51, "learning_rate": 1.0168932838031885e-05, "loss": 1.2003, "step": 18667 }, { "epoch": 0.51, "learning_rate": 1.0168048456398345e-05, "loss": 1.2957, "step": 18668 }, { "epoch": 0.51, "learning_rate": 1.0167164073450075e-05, "loss": 1.2646, "step": 18669 }, { "epoch": 0.51, "learning_rate": 1.0166279689193992e-05, "loss": 1.2358, "step": 18670 }, { "epoch": 0.51, "learning_rate": 1.0165395303637016e-05, "loss": 1.3164, "step": 18671 }, { "epoch": 0.51, "learning_rate": 1.0164510916786063e-05, "loss": 1.3667, "step": 18672 }, { "epoch": 0.51, "learning_rate": 1.0163626528648057e-05, "loss": 1.322, "step": 18673 }, { "epoch": 0.51, "learning_rate": 1.016274213922991e-05, "loss": 1.3069, "step": 18674 }, { "epoch": 0.51, "learning_rate": 1.016185774853855e-05, "loss": 1.0938, "step": 18675 }, { "epoch": 0.51, "learning_rate": 1.0160973356580885e-05, "loss": 1.3181, "step": 18676 }, { "epoch": 0.51, "learning_rate": 1.0160088963363844e-05, "loss": 1.2688, "step": 18677 }, { "epoch": 0.51, "learning_rate": 1.0159204568894341e-05, "loss": 1.2009, "step": 18678 }, { "epoch": 0.51, "learning_rate": 1.0158320173179297e-05, "loss": 1.3899, "step": 18679 }, { "epoch": 0.51, "learning_rate": 1.0157435776225629e-05, "loss": 1.2488, "step": 18680 }, { "epoch": 0.51, "learning_rate": 1.0156551378040259e-05, "loss": 1.2407, "step": 18681 }, { "epoch": 0.51, "learning_rate": 1.01556669786301e-05, "loss": 1.2827, "step": 18682 }, { "epoch": 0.51, "learning_rate": 1.0154782578002082e-05, "loss": 1.1958, "step": 18683 }, { "epoch": 0.51, "learning_rate": 1.0153898176163114e-05, "loss": 1.2905, "step": 18684 }, { "epoch": 0.51, "learning_rate": 1.0153013773120124e-05, "loss": 1.3494, "step": 18685 }, { "epoch": 0.51, "learning_rate": 1.0152129368880021e-05, "loss": 1.3398, "step": 18686 }, { "epoch": 0.51, "learning_rate": 1.0151244963449734e-05, "loss": 1.3008, "step": 18687 }, { "epoch": 0.51, "learning_rate": 1.0150360556836174e-05, "loss": 1.0679, "step": 18688 }, { "epoch": 0.51, "learning_rate": 1.0149476149046265e-05, "loss": 1.2676, "step": 18689 }, { "epoch": 0.51, "learning_rate": 1.0148591740086923e-05, "loss": 1.1953, "step": 18690 }, { "epoch": 0.51, "learning_rate": 1.0147707329965073e-05, "loss": 1.3176, "step": 18691 }, { "epoch": 0.51, "learning_rate": 1.0146822918687626e-05, "loss": 1.1379, "step": 18692 }, { "epoch": 0.51, "learning_rate": 1.014593850626151e-05, "loss": 1.0574, "step": 18693 }, { "epoch": 0.51, "learning_rate": 1.0145054092693636e-05, "loss": 1.0898, "step": 18694 }, { "epoch": 0.51, "learning_rate": 1.014416967799093e-05, "loss": 1.3362, "step": 18695 }, { "epoch": 0.51, "learning_rate": 1.0143285262160304e-05, "loss": 1.4302, "step": 18696 }, { "epoch": 0.51, "learning_rate": 1.0142400845208684e-05, "loss": 1.2793, "step": 18697 }, { "epoch": 0.51, "learning_rate": 1.0141516427142987e-05, "loss": 1.3757, "step": 18698 }, { "epoch": 0.51, "learning_rate": 1.0140632007970131e-05, "loss": 1.6782, "step": 18699 }, { "epoch": 0.51, "learning_rate": 1.0139747587697038e-05, "loss": 1.1843, "step": 18700 }, { "epoch": 0.51, "learning_rate": 1.0138863166330624e-05, "loss": 1.2317, "step": 18701 }, { "epoch": 0.51, "learning_rate": 1.0137978743877812e-05, "loss": 1.2825, "step": 18702 }, { "epoch": 0.51, "learning_rate": 1.0137094320345515e-05, "loss": 1.2266, "step": 18703 }, { "epoch": 0.51, "learning_rate": 1.0136209895740661e-05, "loss": 1.2874, "step": 18704 }, { "epoch": 0.51, "learning_rate": 1.0135325470070163e-05, "loss": 1.3938, "step": 18705 }, { "epoch": 0.51, "learning_rate": 1.0134441043340944e-05, "loss": 1.2639, "step": 18706 }, { "epoch": 0.51, "learning_rate": 1.0133556615559916e-05, "loss": 1.2788, "step": 18707 }, { "epoch": 0.51, "learning_rate": 1.013267218673401e-05, "loss": 1.312, "step": 18708 }, { "epoch": 0.51, "learning_rate": 1.0131787756870135e-05, "loss": 1.2485, "step": 18709 }, { "epoch": 0.51, "learning_rate": 1.0130903325975217e-05, "loss": 1.3181, "step": 18710 }, { "epoch": 0.51, "learning_rate": 1.013001889405617e-05, "loss": 1.3303, "step": 18711 }, { "epoch": 0.51, "learning_rate": 1.0129134461119921e-05, "loss": 1.209, "step": 18712 }, { "epoch": 0.51, "learning_rate": 1.0128250027173379e-05, "loss": 1.2905, "step": 18713 }, { "epoch": 0.51, "learning_rate": 1.0127365592223475e-05, "loss": 1.2986, "step": 18714 }, { "epoch": 0.51, "learning_rate": 1.0126481156277116e-05, "loss": 1.3262, "step": 18715 }, { "epoch": 0.51, "learning_rate": 1.0125596719341235e-05, "loss": 1.3469, "step": 18716 }, { "epoch": 0.51, "learning_rate": 1.0124712281422739e-05, "loss": 1.2883, "step": 18717 }, { "epoch": 0.51, "learning_rate": 1.0123827842528558e-05, "loss": 1.3127, "step": 18718 }, { "epoch": 0.51, "learning_rate": 1.01229434026656e-05, "loss": 1.2742, "step": 18719 }, { "epoch": 0.51, "learning_rate": 1.0122058961840795e-05, "loss": 1.3464, "step": 18720 }, { "epoch": 0.51, "learning_rate": 1.0121174520061056e-05, "loss": 1.2551, "step": 18721 }, { "epoch": 0.51, "learning_rate": 1.0120290077333306e-05, "loss": 1.2542, "step": 18722 }, { "epoch": 0.51, "learning_rate": 1.011940563366446e-05, "loss": 1.209, "step": 18723 }, { "epoch": 0.51, "learning_rate": 1.0118521189061446e-05, "loss": 1.1995, "step": 18724 }, { "epoch": 0.51, "learning_rate": 1.0117636743531174e-05, "loss": 1.3892, "step": 18725 }, { "epoch": 0.51, "learning_rate": 1.0116752297080568e-05, "loss": 1.1919, "step": 18726 }, { "epoch": 0.51, "learning_rate": 1.0115867849716543e-05, "loss": 1.3591, "step": 18727 }, { "epoch": 0.51, "learning_rate": 1.0114983401446028e-05, "loss": 1.0824, "step": 18728 }, { "epoch": 0.51, "learning_rate": 1.0114098952275935e-05, "loss": 1.2561, "step": 18729 }, { "epoch": 0.51, "learning_rate": 1.0113214502213187e-05, "loss": 1.2346, "step": 18730 }, { "epoch": 0.51, "learning_rate": 1.01123300512647e-05, "loss": 1.1934, "step": 18731 }, { "epoch": 0.51, "learning_rate": 1.0111445599437398e-05, "loss": 1.3728, "step": 18732 }, { "epoch": 0.51, "learning_rate": 1.0110561146738193e-05, "loss": 1.3618, "step": 18733 }, { "epoch": 0.51, "learning_rate": 1.0109676693174015e-05, "loss": 1.2607, "step": 18734 }, { "epoch": 0.51, "learning_rate": 1.0108792238751774e-05, "loss": 1.2844, "step": 18735 }, { "epoch": 0.51, "learning_rate": 1.01079077834784e-05, "loss": 1.2166, "step": 18736 }, { "epoch": 0.51, "learning_rate": 1.0107023327360798e-05, "loss": 1.219, "step": 18737 }, { "epoch": 0.51, "learning_rate": 1.0106138870405902e-05, "loss": 1.2095, "step": 18738 }, { "epoch": 0.51, "learning_rate": 1.0105254412620622e-05, "loss": 1.2368, "step": 18739 }, { "epoch": 0.51, "learning_rate": 1.0104369954011883e-05, "loss": 1.3066, "step": 18740 }, { "epoch": 0.51, "learning_rate": 1.01034854945866e-05, "loss": 1.2815, "step": 18741 }, { "epoch": 0.51, "learning_rate": 1.0102601034351697e-05, "loss": 1.429, "step": 18742 }, { "epoch": 0.51, "learning_rate": 1.0101716573314092e-05, "loss": 1.354, "step": 18743 }, { "epoch": 0.51, "learning_rate": 1.0100832111480702e-05, "loss": 1.1494, "step": 18744 }, { "epoch": 0.51, "learning_rate": 1.0099947648858452e-05, "loss": 1.2717, "step": 18745 }, { "epoch": 0.51, "learning_rate": 1.0099063185454259e-05, "loss": 1.342, "step": 18746 }, { "epoch": 0.51, "learning_rate": 1.0098178721275039e-05, "loss": 1.1943, "step": 18747 }, { "epoch": 0.51, "learning_rate": 1.0097294256327719e-05, "loss": 1.4009, "step": 18748 }, { "epoch": 0.51, "learning_rate": 1.009640979061921e-05, "loss": 1.2026, "step": 18749 }, { "epoch": 0.51, "learning_rate": 1.009552532415644e-05, "loss": 1.2432, "step": 18750 }, { "epoch": 0.51, "learning_rate": 1.009464085694632e-05, "loss": 1.3108, "step": 18751 }, { "epoch": 0.51, "learning_rate": 1.0093756388995779e-05, "loss": 1.2415, "step": 18752 }, { "epoch": 0.51, "learning_rate": 1.0092871920311731e-05, "loss": 1.2493, "step": 18753 }, { "epoch": 0.51, "learning_rate": 1.0091987450901097e-05, "loss": 1.2537, "step": 18754 }, { "epoch": 0.51, "learning_rate": 1.0091102980770796e-05, "loss": 1.4092, "step": 18755 }, { "epoch": 0.51, "learning_rate": 1.0090218509927747e-05, "loss": 1.7144, "step": 18756 }, { "epoch": 0.51, "learning_rate": 1.0089334038378871e-05, "loss": 1.2922, "step": 18757 }, { "epoch": 0.51, "learning_rate": 1.0088449566131086e-05, "loss": 1.332, "step": 18758 }, { "epoch": 0.51, "learning_rate": 1.0087565093191318e-05, "loss": 1.136, "step": 18759 }, { "epoch": 0.51, "learning_rate": 1.0086680619566477e-05, "loss": 1.2043, "step": 18760 }, { "epoch": 0.51, "learning_rate": 1.008579614526349e-05, "loss": 1.3145, "step": 18761 }, { "epoch": 0.51, "learning_rate": 1.0084911670289274e-05, "loss": 1.0574, "step": 18762 }, { "epoch": 0.51, "learning_rate": 1.0084027194650752e-05, "loss": 1.1975, "step": 18763 }, { "epoch": 0.51, "learning_rate": 1.0083142718354838e-05, "loss": 1.3984, "step": 18764 }, { "epoch": 0.51, "learning_rate": 1.0082258241408454e-05, "loss": 1.1692, "step": 18765 }, { "epoch": 0.51, "learning_rate": 1.0081373763818519e-05, "loss": 1.2856, "step": 18766 }, { "epoch": 0.51, "learning_rate": 1.0080489285591957e-05, "loss": 1.1267, "step": 18767 }, { "epoch": 0.51, "learning_rate": 1.0079604806735682e-05, "loss": 1.3979, "step": 18768 }, { "epoch": 0.51, "learning_rate": 1.0078720327256619e-05, "loss": 1.2812, "step": 18769 }, { "epoch": 0.51, "learning_rate": 1.0077835847161684e-05, "loss": 1.3101, "step": 18770 }, { "epoch": 0.51, "learning_rate": 1.0076951366457796e-05, "loss": 1.1599, "step": 18771 }, { "epoch": 0.51, "learning_rate": 1.0076066885151878e-05, "loss": 1.2546, "step": 18772 }, { "epoch": 0.51, "learning_rate": 1.007518240325085e-05, "loss": 1.2842, "step": 18773 }, { "epoch": 0.51, "learning_rate": 1.0074297920761627e-05, "loss": 1.314, "step": 18774 }, { "epoch": 0.51, "learning_rate": 1.0073413437691136e-05, "loss": 1.2961, "step": 18775 }, { "epoch": 0.51, "learning_rate": 1.0072528954046287e-05, "loss": 1.2498, "step": 18776 }, { "epoch": 0.51, "learning_rate": 1.0071644469834013e-05, "loss": 1.3438, "step": 18777 }, { "epoch": 0.51, "learning_rate": 1.007075998506122e-05, "loss": 1.2346, "step": 18778 }, { "epoch": 0.51, "learning_rate": 1.0069875499734838e-05, "loss": 1.2952, "step": 18779 }, { "epoch": 0.51, "learning_rate": 1.0068991013861782e-05, "loss": 1.3345, "step": 18780 }, { "epoch": 0.51, "learning_rate": 1.0068106527448974e-05, "loss": 1.1204, "step": 18781 }, { "epoch": 0.51, "learning_rate": 1.0067222040503331e-05, "loss": 1.3086, "step": 18782 }, { "epoch": 0.51, "learning_rate": 1.0066337553031775e-05, "loss": 1.2664, "step": 18783 }, { "epoch": 0.51, "learning_rate": 1.0065453065041224e-05, "loss": 1.2432, "step": 18784 }, { "epoch": 0.51, "learning_rate": 1.00645685765386e-05, "loss": 1.292, "step": 18785 }, { "epoch": 0.51, "learning_rate": 1.006368408753082e-05, "loss": 1.2495, "step": 18786 }, { "epoch": 0.51, "learning_rate": 1.0062799598024809e-05, "loss": 1.2534, "step": 18787 }, { "epoch": 0.51, "learning_rate": 1.006191510802748e-05, "loss": 1.2676, "step": 18788 }, { "epoch": 0.51, "learning_rate": 1.0061030617545758e-05, "loss": 1.2612, "step": 18789 }, { "epoch": 0.51, "learning_rate": 1.0060146126586561e-05, "loss": 1.2988, "step": 18790 }, { "epoch": 0.51, "learning_rate": 1.0059261635156809e-05, "loss": 1.2866, "step": 18791 }, { "epoch": 0.51, "learning_rate": 1.005837714326342e-05, "loss": 1.2317, "step": 18792 }, { "epoch": 0.51, "learning_rate": 1.005749265091332e-05, "loss": 1.3344, "step": 18793 }, { "epoch": 0.51, "learning_rate": 1.005660815811342e-05, "loss": 1.3501, "step": 18794 }, { "epoch": 0.51, "learning_rate": 1.0055723664870649e-05, "loss": 1.1709, "step": 18795 }, { "epoch": 0.51, "learning_rate": 1.0054839171191919e-05, "loss": 1.2642, "step": 18796 }, { "epoch": 0.51, "learning_rate": 1.0053954677084155e-05, "loss": 1.3662, "step": 18797 }, { "epoch": 0.51, "learning_rate": 1.0053070182554272e-05, "loss": 1.2412, "step": 18798 }, { "epoch": 0.51, "learning_rate": 1.0052185687609197e-05, "loss": 1.1636, "step": 18799 }, { "epoch": 0.51, "learning_rate": 1.0051301192255843e-05, "loss": 1.3474, "step": 18800 }, { "epoch": 0.51, "learning_rate": 1.0050416696501133e-05, "loss": 1.2676, "step": 18801 }, { "epoch": 0.51, "learning_rate": 1.0049532200351986e-05, "loss": 1.2378, "step": 18802 }, { "epoch": 0.51, "learning_rate": 1.0048647703815325e-05, "loss": 1.1851, "step": 18803 }, { "epoch": 0.51, "learning_rate": 1.0047763206898063e-05, "loss": 1.2014, "step": 18804 }, { "epoch": 0.51, "learning_rate": 1.0046878709607124e-05, "loss": 1.1089, "step": 18805 }, { "epoch": 0.51, "learning_rate": 1.0045994211949433e-05, "loss": 1.29, "step": 18806 }, { "epoch": 0.51, "learning_rate": 1.00451097139319e-05, "loss": 1.3418, "step": 18807 }, { "epoch": 0.51, "learning_rate": 1.0044225215561453e-05, "loss": 1.3247, "step": 18808 }, { "epoch": 0.51, "learning_rate": 1.0043340716845007e-05, "loss": 1.2898, "step": 18809 }, { "epoch": 0.51, "learning_rate": 1.0042456217789486e-05, "loss": 1.3066, "step": 18810 }, { "epoch": 0.51, "learning_rate": 1.0041571718401805e-05, "loss": 1.3262, "step": 18811 }, { "epoch": 0.51, "learning_rate": 1.0040687218688887e-05, "loss": 1.1763, "step": 18812 }, { "epoch": 0.51, "learning_rate": 1.0039802718657652e-05, "loss": 1.3145, "step": 18813 }, { "epoch": 0.51, "learning_rate": 1.003891821831502e-05, "loss": 1.301, "step": 18814 }, { "epoch": 0.51, "learning_rate": 1.0038033717667907e-05, "loss": 1.25, "step": 18815 }, { "epoch": 0.51, "learning_rate": 1.003714921672324e-05, "loss": 1.1787, "step": 18816 }, { "epoch": 0.51, "learning_rate": 1.0036264715487932e-05, "loss": 1.4141, "step": 18817 }, { "epoch": 0.51, "learning_rate": 1.0035380213968909e-05, "loss": 1.3855, "step": 18818 }, { "epoch": 0.51, "learning_rate": 1.0034495712173084e-05, "loss": 1.2114, "step": 18819 }, { "epoch": 0.51, "learning_rate": 1.0033611210107382e-05, "loss": 1.1543, "step": 18820 }, { "epoch": 0.51, "learning_rate": 1.0032726707778722e-05, "loss": 1.7012, "step": 18821 }, { "epoch": 0.51, "learning_rate": 1.0031842205194024e-05, "loss": 1.3042, "step": 18822 }, { "epoch": 0.51, "learning_rate": 1.0030957702360206e-05, "loss": 1.3562, "step": 18823 }, { "epoch": 0.51, "learning_rate": 1.0030073199284191e-05, "loss": 1.2715, "step": 18824 }, { "epoch": 0.51, "learning_rate": 1.0029188695972898e-05, "loss": 1.2437, "step": 18825 }, { "epoch": 0.51, "learning_rate": 1.0028304192433247e-05, "loss": 1.3308, "step": 18826 }, { "epoch": 0.51, "learning_rate": 1.0027419688672156e-05, "loss": 1.364, "step": 18827 }, { "epoch": 0.51, "learning_rate": 1.0026535184696546e-05, "loss": 1.1418, "step": 18828 }, { "epoch": 0.51, "learning_rate": 1.0025650680513337e-05, "loss": 1.3333, "step": 18829 }, { "epoch": 0.51, "learning_rate": 1.002476617612945e-05, "loss": 1.3259, "step": 18830 }, { "epoch": 0.51, "learning_rate": 1.0023881671551802e-05, "loss": 1.2056, "step": 18831 }, { "epoch": 0.51, "learning_rate": 1.002299716678732e-05, "loss": 1.2148, "step": 18832 }, { "epoch": 0.51, "learning_rate": 1.0022112661842915e-05, "loss": 1.3098, "step": 18833 }, { "epoch": 0.51, "learning_rate": 1.0021228156725513e-05, "loss": 1.3081, "step": 18834 }, { "epoch": 0.51, "learning_rate": 1.0020343651442025e-05, "loss": 1.2634, "step": 18835 }, { "epoch": 0.51, "learning_rate": 1.0019459145999387e-05, "loss": 1.303, "step": 18836 }, { "epoch": 0.51, "learning_rate": 1.0018574640404504e-05, "loss": 1.3086, "step": 18837 }, { "epoch": 0.51, "learning_rate": 1.0017690134664307e-05, "loss": 1.4214, "step": 18838 }, { "epoch": 0.51, "learning_rate": 1.0016805628785707e-05, "loss": 1.3665, "step": 18839 }, { "epoch": 0.51, "learning_rate": 1.0015921122775628e-05, "loss": 1.2966, "step": 18840 }, { "epoch": 0.51, "learning_rate": 1.001503661664099e-05, "loss": 1.2385, "step": 18841 }, { "epoch": 0.51, "learning_rate": 1.0014152110388713e-05, "loss": 1.1555, "step": 18842 }, { "epoch": 0.51, "learning_rate": 1.0013267604025714e-05, "loss": 1.0928, "step": 18843 }, { "epoch": 0.51, "learning_rate": 1.001238309755892e-05, "loss": 1.4331, "step": 18844 }, { "epoch": 0.51, "learning_rate": 1.0011498590995242e-05, "loss": 1.1132, "step": 18845 }, { "epoch": 0.51, "learning_rate": 1.0010614084341609e-05, "loss": 1.3381, "step": 18846 }, { "epoch": 0.51, "learning_rate": 1.0009729577604932e-05, "loss": 1.3, "step": 18847 }, { "epoch": 0.51, "learning_rate": 1.0008845070792138e-05, "loss": 1.3345, "step": 18848 }, { "epoch": 0.51, "learning_rate": 1.0007960563910142e-05, "loss": 1.3054, "step": 18849 }, { "epoch": 0.51, "learning_rate": 1.000707605696587e-05, "loss": 1.4119, "step": 18850 }, { "epoch": 0.51, "learning_rate": 1.0006191549966236e-05, "loss": 1.3071, "step": 18851 }, { "epoch": 0.51, "learning_rate": 1.000530704291816e-05, "loss": 1.3975, "step": 18852 }, { "epoch": 0.51, "learning_rate": 1.0004422535828569e-05, "loss": 1.3684, "step": 18853 }, { "epoch": 0.51, "learning_rate": 1.0003538028704373e-05, "loss": 1.3008, "step": 18854 }, { "epoch": 0.51, "learning_rate": 1.00026535215525e-05, "loss": 1.4312, "step": 18855 }, { "epoch": 0.51, "learning_rate": 1.0001769014379868e-05, "loss": 1.3193, "step": 18856 }, { "epoch": 0.51, "learning_rate": 1.0000884507193395e-05, "loss": 1.2134, "step": 18857 }, { "epoch": 0.51, "learning_rate": 1e-05, "loss": 1.2703, "step": 18858 }, { "epoch": 0.52, "learning_rate": 9.999115492806606e-06, "loss": 1.1658, "step": 18859 }, { "epoch": 0.52, "learning_rate": 9.998230985620135e-06, "loss": 1.2715, "step": 18860 }, { "epoch": 0.52, "learning_rate": 9.997346478447501e-06, "loss": 1.2607, "step": 18861 }, { "epoch": 0.52, "learning_rate": 9.996461971295628e-06, "loss": 1.3176, "step": 18862 }, { "epoch": 0.52, "learning_rate": 9.995577464171436e-06, "loss": 1.1404, "step": 18863 }, { "epoch": 0.52, "learning_rate": 9.994692957081844e-06, "loss": 1.3953, "step": 18864 }, { "epoch": 0.52, "learning_rate": 9.993808450033768e-06, "loss": 1.365, "step": 18865 }, { "epoch": 0.52, "learning_rate": 9.992923943034135e-06, "loss": 1.1274, "step": 18866 }, { "epoch": 0.52, "learning_rate": 9.99203943608986e-06, "loss": 1.2529, "step": 18867 }, { "epoch": 0.52, "learning_rate": 9.991154929207867e-06, "loss": 1.2786, "step": 18868 }, { "epoch": 0.52, "learning_rate": 9.990270422395071e-06, "loss": 1.2122, "step": 18869 }, { "epoch": 0.52, "learning_rate": 9.989385915658396e-06, "loss": 1.4478, "step": 18870 }, { "epoch": 0.52, "learning_rate": 9.98850140900476e-06, "loss": 1.2791, "step": 18871 }, { "epoch": 0.52, "learning_rate": 9.987616902441087e-06, "loss": 1.3813, "step": 18872 }, { "epoch": 0.52, "learning_rate": 9.986732395974289e-06, "loss": 1.3525, "step": 18873 }, { "epoch": 0.52, "learning_rate": 9.985847889611288e-06, "loss": 1.415, "step": 18874 }, { "epoch": 0.52, "learning_rate": 9.984963383359015e-06, "loss": 1.3682, "step": 18875 }, { "epoch": 0.52, "learning_rate": 9.984078877224372e-06, "loss": 1.3638, "step": 18876 }, { "epoch": 0.52, "learning_rate": 9.983194371214298e-06, "loss": 1.2607, "step": 18877 }, { "epoch": 0.52, "learning_rate": 9.982309865335695e-06, "loss": 1.2866, "step": 18878 }, { "epoch": 0.52, "learning_rate": 9.981425359595497e-06, "loss": 1.4258, "step": 18879 }, { "epoch": 0.52, "learning_rate": 9.980540854000615e-06, "loss": 1.4895, "step": 18880 }, { "epoch": 0.52, "learning_rate": 9.979656348557976e-06, "loss": 1.1499, "step": 18881 }, { "epoch": 0.52, "learning_rate": 9.97877184327449e-06, "loss": 1.2554, "step": 18882 }, { "epoch": 0.52, "learning_rate": 9.97788733815709e-06, "loss": 1.3054, "step": 18883 }, { "epoch": 0.52, "learning_rate": 9.977002833212683e-06, "loss": 1.2773, "step": 18884 }, { "epoch": 0.52, "learning_rate": 9.976118328448201e-06, "loss": 1.2468, "step": 18885 }, { "epoch": 0.52, "learning_rate": 9.975233823870551e-06, "loss": 1.1947, "step": 18886 }, { "epoch": 0.52, "learning_rate": 9.974349319486668e-06, "loss": 1.4152, "step": 18887 }, { "epoch": 0.52, "learning_rate": 9.973464815303456e-06, "loss": 1.3435, "step": 18888 }, { "epoch": 0.52, "learning_rate": 9.97258031132785e-06, "loss": 1.3491, "step": 18889 }, { "epoch": 0.52, "learning_rate": 9.971695807566756e-06, "loss": 1.3503, "step": 18890 }, { "epoch": 0.52, "learning_rate": 9.970811304027102e-06, "loss": 1.3674, "step": 18891 }, { "epoch": 0.52, "learning_rate": 9.96992680071581e-06, "loss": 1.4043, "step": 18892 }, { "epoch": 0.52, "learning_rate": 9.969042297639794e-06, "loss": 1.2854, "step": 18893 }, { "epoch": 0.52, "learning_rate": 9.96815779480598e-06, "loss": 1.3052, "step": 18894 }, { "epoch": 0.52, "learning_rate": 9.96727329222128e-06, "loss": 1.3425, "step": 18895 }, { "epoch": 0.52, "learning_rate": 9.966388789892622e-06, "loss": 1.3411, "step": 18896 }, { "epoch": 0.52, "learning_rate": 9.965504287826919e-06, "loss": 1.2825, "step": 18897 }, { "epoch": 0.52, "learning_rate": 9.964619786031096e-06, "loss": 1.3462, "step": 18898 }, { "epoch": 0.52, "learning_rate": 9.96373528451207e-06, "loss": 1.2346, "step": 18899 }, { "epoch": 0.52, "learning_rate": 9.962850783276764e-06, "loss": 1.7593, "step": 18900 }, { "epoch": 0.52, "learning_rate": 9.961966282332094e-06, "loss": 1.3438, "step": 18901 }, { "epoch": 0.52, "learning_rate": 9.961081781684985e-06, "loss": 1.2068, "step": 18902 }, { "epoch": 0.52, "learning_rate": 9.960197281342351e-06, "loss": 1.2437, "step": 18903 }, { "epoch": 0.52, "learning_rate": 9.959312781311116e-06, "loss": 1.4312, "step": 18904 }, { "epoch": 0.52, "learning_rate": 9.958428281598198e-06, "loss": 1.2001, "step": 18905 }, { "epoch": 0.52, "learning_rate": 9.957543782210517e-06, "loss": 1.29, "step": 18906 }, { "epoch": 0.52, "learning_rate": 9.956659283154997e-06, "loss": 1.3462, "step": 18907 }, { "epoch": 0.52, "learning_rate": 9.955774784438548e-06, "loss": 1.3589, "step": 18908 }, { "epoch": 0.52, "learning_rate": 9.954890286068101e-06, "loss": 1.2529, "step": 18909 }, { "epoch": 0.52, "learning_rate": 9.95400578805057e-06, "loss": 1.269, "step": 18910 }, { "epoch": 0.52, "learning_rate": 9.953121290392878e-06, "loss": 1.8535, "step": 18911 }, { "epoch": 0.52, "learning_rate": 9.95223679310194e-06, "loss": 1.2751, "step": 18912 }, { "epoch": 0.52, "learning_rate": 9.951352296184682e-06, "loss": 1.2651, "step": 18913 }, { "epoch": 0.52, "learning_rate": 9.950467799648017e-06, "loss": 1.3113, "step": 18914 }, { "epoch": 0.52, "learning_rate": 9.949583303498872e-06, "loss": 1.2048, "step": 18915 }, { "epoch": 0.52, "learning_rate": 9.948698807744162e-06, "loss": 1.3752, "step": 18916 }, { "epoch": 0.52, "learning_rate": 9.94781431239081e-06, "loss": 1.1663, "step": 18917 }, { "epoch": 0.52, "learning_rate": 9.946929817445731e-06, "loss": 1.2834, "step": 18918 }, { "epoch": 0.52, "learning_rate": 9.94604532291585e-06, "loss": 1.2002, "step": 18919 }, { "epoch": 0.52, "learning_rate": 9.945160828808085e-06, "loss": 1.1799, "step": 18920 }, { "epoch": 0.52, "learning_rate": 9.944276335129353e-06, "loss": 1.3828, "step": 18921 }, { "epoch": 0.52, "learning_rate": 9.94339184188658e-06, "loss": 1.3752, "step": 18922 }, { "epoch": 0.52, "learning_rate": 9.942507349086682e-06, "loss": 1.3225, "step": 18923 }, { "epoch": 0.52, "learning_rate": 9.941622856736582e-06, "loss": 1.3394, "step": 18924 }, { "epoch": 0.52, "learning_rate": 9.940738364843193e-06, "loss": 1.1394, "step": 18925 }, { "epoch": 0.52, "learning_rate": 9.939853873413444e-06, "loss": 1.0483, "step": 18926 }, { "epoch": 0.52, "learning_rate": 9.938969382454244e-06, "loss": 1.2598, "step": 18927 }, { "epoch": 0.52, "learning_rate": 9.938084891972524e-06, "loss": 1.252, "step": 18928 }, { "epoch": 0.52, "learning_rate": 9.937200401975193e-06, "loss": 1.407, "step": 18929 }, { "epoch": 0.52, "learning_rate": 9.936315912469184e-06, "loss": 1.2932, "step": 18930 }, { "epoch": 0.52, "learning_rate": 9.935431423461403e-06, "loss": 1.4155, "step": 18931 }, { "epoch": 0.52, "learning_rate": 9.934546934958783e-06, "loss": 1.3262, "step": 18932 }, { "epoch": 0.52, "learning_rate": 9.933662446968228e-06, "loss": 1.1653, "step": 18933 }, { "epoch": 0.52, "learning_rate": 9.932777959496676e-06, "loss": 1.4312, "step": 18934 }, { "epoch": 0.52, "learning_rate": 9.93189347255103e-06, "loss": 1.4365, "step": 18935 }, { "epoch": 0.52, "learning_rate": 9.93100898613822e-06, "loss": 1.324, "step": 18936 }, { "epoch": 0.52, "learning_rate": 9.930124500265164e-06, "loss": 1.3447, "step": 18937 }, { "epoch": 0.52, "learning_rate": 9.92924001493878e-06, "loss": 1.3335, "step": 18938 }, { "epoch": 0.52, "learning_rate": 9.92835553016599e-06, "loss": 1.2471, "step": 18939 }, { "epoch": 0.52, "learning_rate": 9.927471045953713e-06, "loss": 1.2688, "step": 18940 }, { "epoch": 0.52, "learning_rate": 9.926586562308869e-06, "loss": 1.2043, "step": 18941 }, { "epoch": 0.52, "learning_rate": 9.925702079238375e-06, "loss": 1.176, "step": 18942 }, { "epoch": 0.52, "learning_rate": 9.924817596749155e-06, "loss": 1.2866, "step": 18943 }, { "epoch": 0.52, "learning_rate": 9.923933114848125e-06, "loss": 1.1636, "step": 18944 }, { "epoch": 0.52, "learning_rate": 9.923048633542209e-06, "loss": 1.3834, "step": 18945 }, { "epoch": 0.52, "learning_rate": 9.922164152838321e-06, "loss": 1.3655, "step": 18946 }, { "epoch": 0.52, "learning_rate": 9.921279672743388e-06, "loss": 1.2834, "step": 18947 }, { "epoch": 0.52, "learning_rate": 9.92039519326432e-06, "loss": 1.1582, "step": 18948 }, { "epoch": 0.52, "learning_rate": 9.919510714408048e-06, "loss": 1.3206, "step": 18949 }, { "epoch": 0.52, "learning_rate": 9.918626236181483e-06, "loss": 1.2188, "step": 18950 }, { "epoch": 0.52, "learning_rate": 9.917741758591551e-06, "loss": 1.3586, "step": 18951 }, { "epoch": 0.52, "learning_rate": 9.916857281645167e-06, "loss": 1.325, "step": 18952 }, { "epoch": 0.52, "learning_rate": 9.915972805349253e-06, "loss": 1.2573, "step": 18953 }, { "epoch": 0.52, "learning_rate": 9.915088329710729e-06, "loss": 1.2507, "step": 18954 }, { "epoch": 0.52, "learning_rate": 9.914203854736511e-06, "loss": 1.239, "step": 18955 }, { "epoch": 0.52, "learning_rate": 9.913319380433524e-06, "loss": 1.4556, "step": 18956 }, { "epoch": 0.52, "learning_rate": 9.912434906808686e-06, "loss": 1.1541, "step": 18957 }, { "epoch": 0.52, "learning_rate": 9.911550433868915e-06, "loss": 1.1915, "step": 18958 }, { "epoch": 0.52, "learning_rate": 9.910665961621132e-06, "loss": 1.1755, "step": 18959 }, { "epoch": 0.52, "learning_rate": 9.909781490072258e-06, "loss": 1.3782, "step": 18960 }, { "epoch": 0.52, "learning_rate": 9.90889701922921e-06, "loss": 1.218, "step": 18961 }, { "epoch": 0.52, "learning_rate": 9.908012549098908e-06, "loss": 1.3679, "step": 18962 }, { "epoch": 0.52, "learning_rate": 9.907128079688272e-06, "loss": 1.2471, "step": 18963 }, { "epoch": 0.52, "learning_rate": 9.906243611004226e-06, "loss": 1.2467, "step": 18964 }, { "epoch": 0.52, "learning_rate": 9.905359143053683e-06, "loss": 1.3779, "step": 18965 }, { "epoch": 0.52, "learning_rate": 9.904474675843566e-06, "loss": 1.3362, "step": 18966 }, { "epoch": 0.52, "learning_rate": 9.903590209380794e-06, "loss": 1.3198, "step": 18967 }, { "epoch": 0.52, "learning_rate": 9.902705743672283e-06, "loss": 1.2952, "step": 18968 }, { "epoch": 0.52, "learning_rate": 9.901821278724963e-06, "loss": 1.1411, "step": 18969 }, { "epoch": 0.52, "learning_rate": 9.900936814545743e-06, "loss": 1.2375, "step": 18970 }, { "epoch": 0.52, "learning_rate": 9.900052351141551e-06, "loss": 1.3435, "step": 18971 }, { "epoch": 0.52, "learning_rate": 9.899167888519296e-06, "loss": 1.3853, "step": 18972 }, { "epoch": 0.52, "learning_rate": 9.898283426685912e-06, "loss": 1.323, "step": 18973 }, { "epoch": 0.52, "learning_rate": 9.897398965648304e-06, "loss": 1.2136, "step": 18974 }, { "epoch": 0.52, "learning_rate": 9.896514505413402e-06, "loss": 1.1138, "step": 18975 }, { "epoch": 0.52, "learning_rate": 9.89563004598812e-06, "loss": 1.2144, "step": 18976 }, { "epoch": 0.52, "learning_rate": 9.89474558737938e-06, "loss": 1.1887, "step": 18977 }, { "epoch": 0.52, "learning_rate": 9.893861129594101e-06, "loss": 1.2251, "step": 18978 }, { "epoch": 0.52, "learning_rate": 9.892976672639203e-06, "loss": 1.1978, "step": 18979 }, { "epoch": 0.52, "learning_rate": 9.892092216521606e-06, "loss": 1.262, "step": 18980 }, { "epoch": 0.52, "learning_rate": 9.891207761248227e-06, "loss": 1.3601, "step": 18981 }, { "epoch": 0.52, "learning_rate": 9.890323306825988e-06, "loss": 1.4746, "step": 18982 }, { "epoch": 0.52, "learning_rate": 9.889438853261805e-06, "loss": 1.302, "step": 18983 }, { "epoch": 0.52, "learning_rate": 9.888554400562605e-06, "loss": 1.2781, "step": 18984 }, { "epoch": 0.52, "learning_rate": 9.887669948735301e-06, "loss": 1.2908, "step": 18985 }, { "epoch": 0.52, "learning_rate": 9.886785497786817e-06, "loss": 1.1592, "step": 18986 }, { "epoch": 0.52, "learning_rate": 9.885901047724066e-06, "loss": 1.2004, "step": 18987 }, { "epoch": 0.52, "learning_rate": 9.885016598553975e-06, "loss": 1.3406, "step": 18988 }, { "epoch": 0.52, "learning_rate": 9.884132150283457e-06, "loss": 1.1206, "step": 18989 }, { "epoch": 0.52, "learning_rate": 9.883247702919437e-06, "loss": 1.2844, "step": 18990 }, { "epoch": 0.52, "learning_rate": 9.88236325646883e-06, "loss": 1.3352, "step": 18991 }, { "epoch": 0.52, "learning_rate": 9.88147881093856e-06, "loss": 1.25, "step": 18992 }, { "epoch": 0.52, "learning_rate": 9.880594366335541e-06, "loss": 1.323, "step": 18993 }, { "epoch": 0.52, "learning_rate": 9.879709922666699e-06, "loss": 1.4053, "step": 18994 }, { "epoch": 0.52, "learning_rate": 9.878825479938947e-06, "loss": 1.2308, "step": 18995 }, { "epoch": 0.52, "learning_rate": 9.87794103815921e-06, "loss": 1.1841, "step": 18996 }, { "epoch": 0.52, "learning_rate": 9.877056597334403e-06, "loss": 1.2061, "step": 18997 }, { "epoch": 0.52, "learning_rate": 9.876172157471447e-06, "loss": 1.2019, "step": 18998 }, { "epoch": 0.52, "learning_rate": 9.875287718577263e-06, "loss": 1.3762, "step": 18999 }, { "epoch": 0.52, "learning_rate": 9.874403280658768e-06, "loss": 1.2529, "step": 19000 }, { "epoch": 0.52, "learning_rate": 9.873518843722885e-06, "loss": 1.1592, "step": 19001 }, { "epoch": 0.52, "learning_rate": 9.872634407776529e-06, "loss": 1.3484, "step": 19002 }, { "epoch": 0.52, "learning_rate": 9.871749972826623e-06, "loss": 1.1074, "step": 19003 }, { "epoch": 0.52, "learning_rate": 9.870865538880084e-06, "loss": 1.1481, "step": 19004 }, { "epoch": 0.52, "learning_rate": 9.869981105943833e-06, "loss": 1.4209, "step": 19005 }, { "epoch": 0.52, "learning_rate": 9.869096674024788e-06, "loss": 1.3066, "step": 19006 }, { "epoch": 0.52, "learning_rate": 9.86821224312987e-06, "loss": 1.2202, "step": 19007 }, { "epoch": 0.52, "learning_rate": 9.867327813265994e-06, "loss": 1.2327, "step": 19008 }, { "epoch": 0.52, "learning_rate": 9.866443384440088e-06, "loss": 1.3872, "step": 19009 }, { "epoch": 0.52, "learning_rate": 9.865558956659061e-06, "loss": 1.3024, "step": 19010 }, { "epoch": 0.52, "learning_rate": 9.864674529929842e-06, "loss": 1.4299, "step": 19011 }, { "epoch": 0.52, "learning_rate": 9.863790104259342e-06, "loss": 1.3665, "step": 19012 }, { "epoch": 0.52, "learning_rate": 9.86290567965449e-06, "loss": 1.4141, "step": 19013 }, { "epoch": 0.52, "learning_rate": 9.862021256122191e-06, "loss": 1.3928, "step": 19014 }, { "epoch": 0.52, "learning_rate": 9.861136833669378e-06, "loss": 1.4214, "step": 19015 }, { "epoch": 0.52, "learning_rate": 9.860252412302965e-06, "loss": 1.7671, "step": 19016 }, { "epoch": 0.52, "learning_rate": 9.85936799202987e-06, "loss": 1.2761, "step": 19017 }, { "epoch": 0.52, "learning_rate": 9.858483572857016e-06, "loss": 1.1719, "step": 19018 }, { "epoch": 0.52, "learning_rate": 9.857599154791318e-06, "loss": 1.4038, "step": 19019 }, { "epoch": 0.52, "learning_rate": 9.856714737839699e-06, "loss": 1.3633, "step": 19020 }, { "epoch": 0.52, "learning_rate": 9.855830322009075e-06, "loss": 1.2, "step": 19021 }, { "epoch": 0.52, "learning_rate": 9.854945907306368e-06, "loss": 1.2722, "step": 19022 }, { "epoch": 0.52, "learning_rate": 9.854061493738494e-06, "loss": 1.2744, "step": 19023 }, { "epoch": 0.52, "learning_rate": 9.853177081312376e-06, "loss": 1.2598, "step": 19024 }, { "epoch": 0.52, "learning_rate": 9.85229267003493e-06, "loss": 1.1936, "step": 19025 }, { "epoch": 0.52, "learning_rate": 9.851408259913078e-06, "loss": 1.3291, "step": 19026 }, { "epoch": 0.52, "learning_rate": 9.850523850953737e-06, "loss": 1.0898, "step": 19027 }, { "epoch": 0.52, "learning_rate": 9.84963944316383e-06, "loss": 1.1543, "step": 19028 }, { "epoch": 0.52, "learning_rate": 9.84875503655027e-06, "loss": 1.4258, "step": 19029 }, { "epoch": 0.52, "learning_rate": 9.847870631119979e-06, "loss": 1.3752, "step": 19030 }, { "epoch": 0.52, "learning_rate": 9.846986226879878e-06, "loss": 1.2986, "step": 19031 }, { "epoch": 0.52, "learning_rate": 9.846101823836884e-06, "loss": 1.2695, "step": 19032 }, { "epoch": 0.52, "learning_rate": 9.84521742199792e-06, "loss": 1.2805, "step": 19033 }, { "epoch": 0.52, "learning_rate": 9.844333021369898e-06, "loss": 1.3982, "step": 19034 }, { "epoch": 0.52, "learning_rate": 9.843448621959745e-06, "loss": 1.2124, "step": 19035 }, { "epoch": 0.52, "learning_rate": 9.842564223774373e-06, "loss": 1.2178, "step": 19036 }, { "epoch": 0.52, "learning_rate": 9.841679826820708e-06, "loss": 1.2092, "step": 19037 }, { "epoch": 0.52, "learning_rate": 9.840795431105662e-06, "loss": 1.2646, "step": 19038 }, { "epoch": 0.52, "learning_rate": 9.839911036636161e-06, "loss": 1.3057, "step": 19039 }, { "epoch": 0.52, "learning_rate": 9.839026643419116e-06, "loss": 1.2681, "step": 19040 }, { "epoch": 0.52, "learning_rate": 9.838142251461456e-06, "loss": 1.3679, "step": 19041 }, { "epoch": 0.52, "learning_rate": 9.837257860770093e-06, "loss": 1.2117, "step": 19042 }, { "epoch": 0.52, "learning_rate": 9.836373471351949e-06, "loss": 1.4109, "step": 19043 }, { "epoch": 0.52, "learning_rate": 9.835489083213939e-06, "loss": 1.2231, "step": 19044 }, { "epoch": 0.52, "learning_rate": 9.834604696362984e-06, "loss": 1.1265, "step": 19045 }, { "epoch": 0.52, "learning_rate": 9.833720310806011e-06, "loss": 1.2756, "step": 19046 }, { "epoch": 0.52, "learning_rate": 9.832835926549924e-06, "loss": 1.2258, "step": 19047 }, { "epoch": 0.52, "learning_rate": 9.831951543601657e-06, "loss": 1.0532, "step": 19048 }, { "epoch": 0.52, "learning_rate": 9.831067161968117e-06, "loss": 1.3513, "step": 19049 }, { "epoch": 0.52, "learning_rate": 9.830182781656234e-06, "loss": 1.2561, "step": 19050 }, { "epoch": 0.52, "learning_rate": 9.829298402672913e-06, "loss": 1.168, "step": 19051 }, { "epoch": 0.52, "learning_rate": 9.82841402502509e-06, "loss": 1.3645, "step": 19052 }, { "epoch": 0.52, "learning_rate": 9.827529648719667e-06, "loss": 1.2627, "step": 19053 }, { "epoch": 0.52, "learning_rate": 9.826645273763578e-06, "loss": 1.2283, "step": 19054 }, { "epoch": 0.52, "learning_rate": 9.825760900163728e-06, "loss": 1.0493, "step": 19055 }, { "epoch": 0.52, "learning_rate": 9.82487652792705e-06, "loss": 1.1257, "step": 19056 }, { "epoch": 0.52, "learning_rate": 9.823992157060447e-06, "loss": 1.3481, "step": 19057 }, { "epoch": 0.52, "learning_rate": 9.823107787570855e-06, "loss": 1.2841, "step": 19058 }, { "epoch": 0.52, "learning_rate": 9.822223419465178e-06, "loss": 1.1729, "step": 19059 }, { "epoch": 0.52, "learning_rate": 9.821339052750343e-06, "loss": 1.343, "step": 19060 }, { "epoch": 0.52, "learning_rate": 9.820454687433269e-06, "loss": 1.3494, "step": 19061 }, { "epoch": 0.52, "learning_rate": 9.819570323520871e-06, "loss": 1.374, "step": 19062 }, { "epoch": 0.52, "learning_rate": 9.818685961020074e-06, "loss": 1.3091, "step": 19063 }, { "epoch": 0.52, "learning_rate": 9.817801599937789e-06, "loss": 1.363, "step": 19064 }, { "epoch": 0.52, "learning_rate": 9.81691724028094e-06, "loss": 1.2139, "step": 19065 }, { "epoch": 0.52, "learning_rate": 9.816032882056443e-06, "loss": 1.2761, "step": 19066 }, { "epoch": 0.52, "learning_rate": 9.81514852527122e-06, "loss": 1.1177, "step": 19067 }, { "epoch": 0.52, "learning_rate": 9.814264169932187e-06, "loss": 1.1936, "step": 19068 }, { "epoch": 0.52, "learning_rate": 9.813379816046265e-06, "loss": 1.2786, "step": 19069 }, { "epoch": 0.52, "learning_rate": 9.812495463620371e-06, "loss": 1.4717, "step": 19070 }, { "epoch": 0.52, "learning_rate": 9.811611112661426e-06, "loss": 1.3931, "step": 19071 }, { "epoch": 0.52, "learning_rate": 9.810726763176344e-06, "loss": 1.3208, "step": 19072 }, { "epoch": 0.52, "learning_rate": 9.80984241517205e-06, "loss": 1.3459, "step": 19073 }, { "epoch": 0.52, "learning_rate": 9.808958068655455e-06, "loss": 1.3296, "step": 19074 }, { "epoch": 0.52, "learning_rate": 9.808073723633486e-06, "loss": 1.3376, "step": 19075 }, { "epoch": 0.52, "learning_rate": 9.807189380113055e-06, "loss": 1.3425, "step": 19076 }, { "epoch": 0.52, "learning_rate": 9.806305038101085e-06, "loss": 1.3433, "step": 19077 }, { "epoch": 0.52, "learning_rate": 9.805420697604495e-06, "loss": 1.3621, "step": 19078 }, { "epoch": 0.52, "learning_rate": 9.804536358630198e-06, "loss": 1.3015, "step": 19079 }, { "epoch": 0.52, "learning_rate": 9.803652021185122e-06, "loss": 1.2727, "step": 19080 }, { "epoch": 0.52, "learning_rate": 9.802767685276177e-06, "loss": 1.2974, "step": 19081 }, { "epoch": 0.52, "learning_rate": 9.801883350910287e-06, "loss": 1.3848, "step": 19082 }, { "epoch": 0.52, "learning_rate": 9.800999018094364e-06, "loss": 1.4197, "step": 19083 }, { "epoch": 0.52, "learning_rate": 9.800114686835335e-06, "loss": 1.3093, "step": 19084 }, { "epoch": 0.52, "learning_rate": 9.799230357140114e-06, "loss": 1.334, "step": 19085 }, { "epoch": 0.52, "learning_rate": 9.79834602901562e-06, "loss": 1.4678, "step": 19086 }, { "epoch": 0.52, "learning_rate": 9.797461702468771e-06, "loss": 1.187, "step": 19087 }, { "epoch": 0.52, "learning_rate": 9.796577377506488e-06, "loss": 1.4478, "step": 19088 }, { "epoch": 0.52, "learning_rate": 9.795693054135686e-06, "loss": 1.2542, "step": 19089 }, { "epoch": 0.52, "learning_rate": 9.794808732363289e-06, "loss": 1.2661, "step": 19090 }, { "epoch": 0.52, "learning_rate": 9.793924412196209e-06, "loss": 1.4399, "step": 19091 }, { "epoch": 0.52, "learning_rate": 9.793040093641365e-06, "loss": 1.4526, "step": 19092 }, { "epoch": 0.52, "learning_rate": 9.792155776705683e-06, "loss": 1.26, "step": 19093 }, { "epoch": 0.52, "learning_rate": 9.791271461396071e-06, "loss": 1.354, "step": 19094 }, { "epoch": 0.52, "learning_rate": 9.790387147719461e-06, "loss": 1.2219, "step": 19095 }, { "epoch": 0.52, "learning_rate": 9.789502835682755e-06, "loss": 1.3481, "step": 19096 }, { "epoch": 0.52, "learning_rate": 9.788618525292887e-06, "loss": 1.281, "step": 19097 }, { "epoch": 0.52, "learning_rate": 9.787734216556762e-06, "loss": 1.1729, "step": 19098 }, { "epoch": 0.52, "learning_rate": 9.78684990948131e-06, "loss": 1.3542, "step": 19099 }, { "epoch": 0.52, "learning_rate": 9.78596560407344e-06, "loss": 1.3086, "step": 19100 }, { "epoch": 0.52, "learning_rate": 9.785081300340079e-06, "loss": 1.7065, "step": 19101 }, { "epoch": 0.52, "learning_rate": 9.784196998288135e-06, "loss": 1.1909, "step": 19102 }, { "epoch": 0.52, "learning_rate": 9.783312697924538e-06, "loss": 1.2273, "step": 19103 }, { "epoch": 0.52, "learning_rate": 9.782428399256196e-06, "loss": 1.2847, "step": 19104 }, { "epoch": 0.52, "learning_rate": 9.781544102290036e-06, "loss": 1.3447, "step": 19105 }, { "epoch": 0.52, "learning_rate": 9.780659807032967e-06, "loss": 1.2175, "step": 19106 }, { "epoch": 0.52, "learning_rate": 9.779775513491916e-06, "loss": 1.3745, "step": 19107 }, { "epoch": 0.52, "learning_rate": 9.778891221673797e-06, "loss": 1.3022, "step": 19108 }, { "epoch": 0.52, "learning_rate": 9.77800693158553e-06, "loss": 1.2754, "step": 19109 }, { "epoch": 0.52, "learning_rate": 9.77712264323403e-06, "loss": 1.3574, "step": 19110 }, { "epoch": 0.52, "learning_rate": 9.77623835662622e-06, "loss": 1.2358, "step": 19111 }, { "epoch": 0.52, "learning_rate": 9.775354071769016e-06, "loss": 1.7344, "step": 19112 }, { "epoch": 0.52, "learning_rate": 9.774469788669334e-06, "loss": 1.5464, "step": 19113 }, { "epoch": 0.52, "learning_rate": 9.773585507334097e-06, "loss": 1.3103, "step": 19114 }, { "epoch": 0.52, "learning_rate": 9.772701227770219e-06, "loss": 1.2291, "step": 19115 }, { "epoch": 0.52, "learning_rate": 9.77181694998462e-06, "loss": 1.4451, "step": 19116 }, { "epoch": 0.52, "learning_rate": 9.770932673984217e-06, "loss": 1.2561, "step": 19117 }, { "epoch": 0.52, "learning_rate": 9.770048399775932e-06, "loss": 1.3411, "step": 19118 }, { "epoch": 0.52, "learning_rate": 9.769164127366677e-06, "loss": 1.3093, "step": 19119 }, { "epoch": 0.52, "learning_rate": 9.768279856763374e-06, "loss": 1.2683, "step": 19120 }, { "epoch": 0.52, "learning_rate": 9.76739558797294e-06, "loss": 1.302, "step": 19121 }, { "epoch": 0.52, "learning_rate": 9.766511321002294e-06, "loss": 1.2031, "step": 19122 }, { "epoch": 0.52, "learning_rate": 9.765627055858354e-06, "loss": 1.368, "step": 19123 }, { "epoch": 0.52, "learning_rate": 9.764742792548037e-06, "loss": 1.4077, "step": 19124 }, { "epoch": 0.52, "learning_rate": 9.763858531078264e-06, "loss": 1.3215, "step": 19125 }, { "epoch": 0.52, "learning_rate": 9.762974271455948e-06, "loss": 1.3257, "step": 19126 }, { "epoch": 0.52, "learning_rate": 9.762090013688012e-06, "loss": 1.2612, "step": 19127 }, { "epoch": 0.52, "learning_rate": 9.76120575778137e-06, "loss": 1.2869, "step": 19128 }, { "epoch": 0.52, "learning_rate": 9.760321503742945e-06, "loss": 1.2249, "step": 19129 }, { "epoch": 0.52, "learning_rate": 9.759437251579649e-06, "loss": 1.2534, "step": 19130 }, { "epoch": 0.52, "learning_rate": 9.758553001298405e-06, "loss": 1.7148, "step": 19131 }, { "epoch": 0.52, "learning_rate": 9.757668752906125e-06, "loss": 1.2246, "step": 19132 }, { "epoch": 0.52, "learning_rate": 9.756784506409734e-06, "loss": 1.3635, "step": 19133 }, { "epoch": 0.52, "learning_rate": 9.755900261816145e-06, "loss": 1.3428, "step": 19134 }, { "epoch": 0.52, "learning_rate": 9.75501601913228e-06, "loss": 1.3623, "step": 19135 }, { "epoch": 0.52, "learning_rate": 9.754131778365052e-06, "loss": 1.3318, "step": 19136 }, { "epoch": 0.52, "learning_rate": 9.753247539521382e-06, "loss": 1.3518, "step": 19137 }, { "epoch": 0.52, "learning_rate": 9.752363302608186e-06, "loss": 1.7817, "step": 19138 }, { "epoch": 0.52, "learning_rate": 9.751479067632381e-06, "loss": 1.3164, "step": 19139 }, { "epoch": 0.52, "learning_rate": 9.750594834600894e-06, "loss": 1.1807, "step": 19140 }, { "epoch": 0.52, "learning_rate": 9.74971060352063e-06, "loss": 1.3269, "step": 19141 }, { "epoch": 0.52, "learning_rate": 9.748826374398517e-06, "loss": 1.2632, "step": 19142 }, { "epoch": 0.52, "learning_rate": 9.747942147241462e-06, "loss": 1.2378, "step": 19143 }, { "epoch": 0.52, "learning_rate": 9.747057922056396e-06, "loss": 1.3079, "step": 19144 }, { "epoch": 0.52, "learning_rate": 9.746173698850225e-06, "loss": 1.2051, "step": 19145 }, { "epoch": 0.52, "learning_rate": 9.745289477629876e-06, "loss": 1.239, "step": 19146 }, { "epoch": 0.52, "learning_rate": 9.744405258402256e-06, "loss": 1.3193, "step": 19147 }, { "epoch": 0.52, "learning_rate": 9.743521041174297e-06, "loss": 1.3066, "step": 19148 }, { "epoch": 0.52, "learning_rate": 9.742636825952902e-06, "loss": 1.4956, "step": 19149 }, { "epoch": 0.52, "learning_rate": 9.741752612745002e-06, "loss": 1.3774, "step": 19150 }, { "epoch": 0.52, "learning_rate": 9.7408684015575e-06, "loss": 1.2366, "step": 19151 }, { "epoch": 0.52, "learning_rate": 9.73998419239733e-06, "loss": 1.3163, "step": 19152 }, { "epoch": 0.52, "learning_rate": 9.739099985271394e-06, "loss": 1.1718, "step": 19153 }, { "epoch": 0.52, "learning_rate": 9.73821578018662e-06, "loss": 1.3672, "step": 19154 }, { "epoch": 0.52, "learning_rate": 9.737331577149923e-06, "loss": 1.2742, "step": 19155 }, { "epoch": 0.52, "learning_rate": 9.73644737616822e-06, "loss": 1.2764, "step": 19156 }, { "epoch": 0.52, "learning_rate": 9.73556317724843e-06, "loss": 1.1204, "step": 19157 }, { "epoch": 0.52, "learning_rate": 9.734678980397467e-06, "loss": 1.3044, "step": 19158 }, { "epoch": 0.52, "learning_rate": 9.733794785622254e-06, "loss": 1.2336, "step": 19159 }, { "epoch": 0.52, "learning_rate": 9.732910592929702e-06, "loss": 1.3618, "step": 19160 }, { "epoch": 0.52, "learning_rate": 9.732026402326735e-06, "loss": 1.3528, "step": 19161 }, { "epoch": 0.52, "learning_rate": 9.731142213820266e-06, "loss": 1.0366, "step": 19162 }, { "epoch": 0.52, "learning_rate": 9.730258027417214e-06, "loss": 1.3721, "step": 19163 }, { "epoch": 0.52, "learning_rate": 9.729373843124497e-06, "loss": 1.2268, "step": 19164 }, { "epoch": 0.52, "learning_rate": 9.728489660949031e-06, "loss": 1.2246, "step": 19165 }, { "epoch": 0.52, "learning_rate": 9.727605480897733e-06, "loss": 1.3389, "step": 19166 }, { "epoch": 0.52, "learning_rate": 9.726721302977526e-06, "loss": 1.3914, "step": 19167 }, { "epoch": 0.52, "learning_rate": 9.725837127195318e-06, "loss": 1.2781, "step": 19168 }, { "epoch": 0.52, "learning_rate": 9.724952953558033e-06, "loss": 1.1794, "step": 19169 }, { "epoch": 0.52, "learning_rate": 9.724068782072588e-06, "loss": 1.2419, "step": 19170 }, { "epoch": 0.52, "learning_rate": 9.723184612745897e-06, "loss": 1.2605, "step": 19171 }, { "epoch": 0.52, "learning_rate": 9.722300445584882e-06, "loss": 1.2397, "step": 19172 }, { "epoch": 0.52, "learning_rate": 9.721416280596456e-06, "loss": 1.4419, "step": 19173 }, { "epoch": 0.52, "learning_rate": 9.720532117787538e-06, "loss": 1.2935, "step": 19174 }, { "epoch": 0.52, "learning_rate": 9.719647957165046e-06, "loss": 1.3193, "step": 19175 }, { "epoch": 0.52, "learning_rate": 9.718763798735897e-06, "loss": 1.2671, "step": 19176 }, { "epoch": 0.52, "learning_rate": 9.717879642507006e-06, "loss": 1.3074, "step": 19177 }, { "epoch": 0.52, "learning_rate": 9.716995488485295e-06, "loss": 1.3457, "step": 19178 }, { "epoch": 0.52, "learning_rate": 9.716111336677675e-06, "loss": 1.3792, "step": 19179 }, { "epoch": 0.52, "learning_rate": 9.715227187091069e-06, "loss": 1.2944, "step": 19180 }, { "epoch": 0.52, "learning_rate": 9.71434303973239e-06, "loss": 1.3882, "step": 19181 }, { "epoch": 0.52, "learning_rate": 9.713458894608558e-06, "loss": 1.321, "step": 19182 }, { "epoch": 0.52, "learning_rate": 9.712574751726485e-06, "loss": 1.2483, "step": 19183 }, { "epoch": 0.52, "learning_rate": 9.711690611093094e-06, "loss": 1.355, "step": 19184 }, { "epoch": 0.52, "learning_rate": 9.710806472715303e-06, "loss": 1.3582, "step": 19185 }, { "epoch": 0.52, "learning_rate": 9.709922336600021e-06, "loss": 1.208, "step": 19186 }, { "epoch": 0.52, "learning_rate": 9.709038202754177e-06, "loss": 1.3545, "step": 19187 }, { "epoch": 0.52, "learning_rate": 9.708154071184675e-06, "loss": 1.1705, "step": 19188 }, { "epoch": 0.52, "learning_rate": 9.707269941898445e-06, "loss": 1.4172, "step": 19189 }, { "epoch": 0.52, "learning_rate": 9.706385814902389e-06, "loss": 1.3054, "step": 19190 }, { "epoch": 0.52, "learning_rate": 9.70550169020344e-06, "loss": 1.0737, "step": 19191 }, { "epoch": 0.52, "learning_rate": 9.7046175678085e-06, "loss": 1.3408, "step": 19192 }, { "epoch": 0.52, "learning_rate": 9.703733447724501e-06, "loss": 1.3096, "step": 19193 }, { "epoch": 0.52, "learning_rate": 9.702849329958344e-06, "loss": 1.2424, "step": 19194 }, { "epoch": 0.52, "learning_rate": 9.701965214516963e-06, "loss": 1.3435, "step": 19195 }, { "epoch": 0.52, "learning_rate": 9.701081101407258e-06, "loss": 1.2898, "step": 19196 }, { "epoch": 0.52, "learning_rate": 9.700196990636162e-06, "loss": 1.2534, "step": 19197 }, { "epoch": 0.52, "learning_rate": 9.699312882210574e-06, "loss": 1.4177, "step": 19198 }, { "epoch": 0.52, "learning_rate": 9.69842877613743e-06, "loss": 1.0947, "step": 19199 }, { "epoch": 0.52, "learning_rate": 9.69754467242363e-06, "loss": 1.3772, "step": 19200 }, { "epoch": 0.52, "learning_rate": 9.6966605710761e-06, "loss": 1.3059, "step": 19201 }, { "epoch": 0.52, "learning_rate": 9.695776472101757e-06, "loss": 1.1353, "step": 19202 }, { "epoch": 0.52, "learning_rate": 9.694892375507516e-06, "loss": 1.3577, "step": 19203 }, { "epoch": 0.52, "learning_rate": 9.694008281300293e-06, "loss": 1.291, "step": 19204 }, { "epoch": 0.52, "learning_rate": 9.693124189487006e-06, "loss": 1.2656, "step": 19205 }, { "epoch": 0.52, "learning_rate": 9.69224010007457e-06, "loss": 1.2869, "step": 19206 }, { "epoch": 0.52, "learning_rate": 9.691356013069903e-06, "loss": 1.1677, "step": 19207 }, { "epoch": 0.52, "learning_rate": 9.690471928479923e-06, "loss": 1.238, "step": 19208 }, { "epoch": 0.52, "learning_rate": 9.689587846311542e-06, "loss": 1.2668, "step": 19209 }, { "epoch": 0.52, "learning_rate": 9.688703766571682e-06, "loss": 1.2144, "step": 19210 }, { "epoch": 0.52, "learning_rate": 9.687819689267256e-06, "loss": 1.24, "step": 19211 }, { "epoch": 0.52, "learning_rate": 9.686935614405183e-06, "loss": 1.248, "step": 19212 }, { "epoch": 0.52, "learning_rate": 9.686051541992378e-06, "loss": 1.1846, "step": 19213 }, { "epoch": 0.52, "learning_rate": 9.685167472035759e-06, "loss": 1.2866, "step": 19214 }, { "epoch": 0.52, "learning_rate": 9.68428340454224e-06, "loss": 1.3052, "step": 19215 }, { "epoch": 0.52, "learning_rate": 9.683399339518739e-06, "loss": 1.1807, "step": 19216 }, { "epoch": 0.52, "learning_rate": 9.682515276972174e-06, "loss": 1.2463, "step": 19217 }, { "epoch": 0.52, "learning_rate": 9.68163121690946e-06, "loss": 1.2334, "step": 19218 }, { "epoch": 0.52, "learning_rate": 9.680747159337515e-06, "loss": 1.2024, "step": 19219 }, { "epoch": 0.52, "learning_rate": 9.679863104263251e-06, "loss": 1.1848, "step": 19220 }, { "epoch": 0.52, "learning_rate": 9.67897905169359e-06, "loss": 1.2583, "step": 19221 }, { "epoch": 0.52, "learning_rate": 9.678095001635445e-06, "loss": 1.2986, "step": 19222 }, { "epoch": 0.52, "learning_rate": 9.677210954095733e-06, "loss": 1.1257, "step": 19223 }, { "epoch": 0.52, "learning_rate": 9.67632690908137e-06, "loss": 1.1795, "step": 19224 }, { "epoch": 0.53, "learning_rate": 9.675442866599277e-06, "loss": 1.1726, "step": 19225 }, { "epoch": 0.53, "learning_rate": 9.674558826656362e-06, "loss": 1.1365, "step": 19226 }, { "epoch": 0.53, "learning_rate": 9.673674789259548e-06, "loss": 1.3633, "step": 19227 }, { "epoch": 0.53, "learning_rate": 9.672790754415748e-06, "loss": 1.312, "step": 19228 }, { "epoch": 0.53, "learning_rate": 9.67190672213188e-06, "loss": 1.1106, "step": 19229 }, { "epoch": 0.53, "learning_rate": 9.671022692414858e-06, "loss": 1.1943, "step": 19230 }, { "epoch": 0.53, "learning_rate": 9.6701386652716e-06, "loss": 1.2854, "step": 19231 }, { "epoch": 0.53, "learning_rate": 9.669254640709025e-06, "loss": 1.2881, "step": 19232 }, { "epoch": 0.53, "learning_rate": 9.66837061873404e-06, "loss": 1.6377, "step": 19233 }, { "epoch": 0.53, "learning_rate": 9.667486599353575e-06, "loss": 1.3223, "step": 19234 }, { "epoch": 0.53, "learning_rate": 9.666602582574532e-06, "loss": 1.3975, "step": 19235 }, { "epoch": 0.53, "learning_rate": 9.66571856840384e-06, "loss": 1.3586, "step": 19236 }, { "epoch": 0.53, "learning_rate": 9.664834556848402e-06, "loss": 1.28, "step": 19237 }, { "epoch": 0.53, "learning_rate": 9.663950547915145e-06, "loss": 1.4099, "step": 19238 }, { "epoch": 0.53, "learning_rate": 9.663066541610979e-06, "loss": 1.2661, "step": 19239 }, { "epoch": 0.53, "learning_rate": 9.662182537942823e-06, "loss": 1.3037, "step": 19240 }, { "epoch": 0.53, "learning_rate": 9.661298536917592e-06, "loss": 1.3, "step": 19241 }, { "epoch": 0.53, "learning_rate": 9.660414538542203e-06, "loss": 1.1936, "step": 19242 }, { "epoch": 0.53, "learning_rate": 9.659530542823568e-06, "loss": 1.304, "step": 19243 }, { "epoch": 0.53, "learning_rate": 9.65864654976861e-06, "loss": 1.2988, "step": 19244 }, { "epoch": 0.53, "learning_rate": 9.657762559384237e-06, "loss": 1.3804, "step": 19245 }, { "epoch": 0.53, "learning_rate": 9.65687857167737e-06, "loss": 1.2335, "step": 19246 }, { "epoch": 0.53, "learning_rate": 9.655994586654925e-06, "loss": 1.4131, "step": 19247 }, { "epoch": 0.53, "learning_rate": 9.655110604323814e-06, "loss": 1.2019, "step": 19248 }, { "epoch": 0.53, "learning_rate": 9.654226624690958e-06, "loss": 1.2852, "step": 19249 }, { "epoch": 0.53, "learning_rate": 9.65334264776327e-06, "loss": 1.2874, "step": 19250 }, { "epoch": 0.53, "learning_rate": 9.652458673547667e-06, "loss": 1.2827, "step": 19251 }, { "epoch": 0.53, "learning_rate": 9.65157470205106e-06, "loss": 1.2905, "step": 19252 }, { "epoch": 0.53, "learning_rate": 9.650690733280373e-06, "loss": 1.3555, "step": 19253 }, { "epoch": 0.53, "learning_rate": 9.649806767242515e-06, "loss": 1.408, "step": 19254 }, { "epoch": 0.53, "learning_rate": 9.648922803944405e-06, "loss": 1.21, "step": 19255 }, { "epoch": 0.53, "learning_rate": 9.648038843392957e-06, "loss": 1.2883, "step": 19256 }, { "epoch": 0.53, "learning_rate": 9.647154885595088e-06, "loss": 1.2104, "step": 19257 }, { "epoch": 0.53, "learning_rate": 9.646270930557713e-06, "loss": 1.1189, "step": 19258 }, { "epoch": 0.53, "learning_rate": 9.64538697828775e-06, "loss": 1.2417, "step": 19259 }, { "epoch": 0.53, "learning_rate": 9.64450302879211e-06, "loss": 1.2229, "step": 19260 }, { "epoch": 0.53, "learning_rate": 9.643619082077713e-06, "loss": 1.2925, "step": 19261 }, { "epoch": 0.53, "learning_rate": 9.642735138151473e-06, "loss": 1.2822, "step": 19262 }, { "epoch": 0.53, "learning_rate": 9.641851197020302e-06, "loss": 1.3638, "step": 19263 }, { "epoch": 0.53, "learning_rate": 9.640967258691122e-06, "loss": 1.2944, "step": 19264 }, { "epoch": 0.53, "learning_rate": 9.640083323170843e-06, "loss": 1.0417, "step": 19265 }, { "epoch": 0.53, "learning_rate": 9.639199390466384e-06, "loss": 1.3005, "step": 19266 }, { "epoch": 0.53, "learning_rate": 9.63831546058466e-06, "loss": 1.1553, "step": 19267 }, { "epoch": 0.53, "learning_rate": 9.637431533532586e-06, "loss": 1.1357, "step": 19268 }, { "epoch": 0.53, "learning_rate": 9.636547609317074e-06, "loss": 1.1775, "step": 19269 }, { "epoch": 0.53, "learning_rate": 9.635663687945047e-06, "loss": 1.2617, "step": 19270 }, { "epoch": 0.53, "learning_rate": 9.634779769423412e-06, "loss": 1.4175, "step": 19271 }, { "epoch": 0.53, "learning_rate": 9.633895853759093e-06, "loss": 1.3591, "step": 19272 }, { "epoch": 0.53, "learning_rate": 9.633011940958995e-06, "loss": 1.3418, "step": 19273 }, { "epoch": 0.53, "learning_rate": 9.632128031030044e-06, "loss": 1.29, "step": 19274 }, { "epoch": 0.53, "learning_rate": 9.631244123979146e-06, "loss": 1.3276, "step": 19275 }, { "epoch": 0.53, "learning_rate": 9.630360219813226e-06, "loss": 1.3523, "step": 19276 }, { "epoch": 0.53, "learning_rate": 9.629476318539189e-06, "loss": 1.2676, "step": 19277 }, { "epoch": 0.53, "learning_rate": 9.628592420163954e-06, "loss": 1.0835, "step": 19278 }, { "epoch": 0.53, "learning_rate": 9.627708524694442e-06, "loss": 1.3394, "step": 19279 }, { "epoch": 0.53, "learning_rate": 9.626824632137561e-06, "loss": 1.1379, "step": 19280 }, { "epoch": 0.53, "learning_rate": 9.62594074250023e-06, "loss": 1.1951, "step": 19281 }, { "epoch": 0.53, "learning_rate": 9.62505685578936e-06, "loss": 1.3684, "step": 19282 }, { "epoch": 0.53, "learning_rate": 9.624172972011871e-06, "loss": 1.1482, "step": 19283 }, { "epoch": 0.53, "learning_rate": 9.623289091174675e-06, "loss": 1.6589, "step": 19284 }, { "epoch": 0.53, "learning_rate": 9.62240521328469e-06, "loss": 1.2688, "step": 19285 }, { "epoch": 0.53, "learning_rate": 9.621521338348827e-06, "loss": 1.2258, "step": 19286 }, { "epoch": 0.53, "learning_rate": 9.620637466374005e-06, "loss": 1.3003, "step": 19287 }, { "epoch": 0.53, "learning_rate": 9.619753597367134e-06, "loss": 1.6934, "step": 19288 }, { "epoch": 0.53, "learning_rate": 9.618869731335135e-06, "loss": 1.4292, "step": 19289 }, { "epoch": 0.53, "learning_rate": 9.617985868284918e-06, "loss": 1.3098, "step": 19290 }, { "epoch": 0.53, "learning_rate": 9.617102008223403e-06, "loss": 1.2175, "step": 19291 }, { "epoch": 0.53, "learning_rate": 9.616218151157497e-06, "loss": 1.3506, "step": 19292 }, { "epoch": 0.53, "learning_rate": 9.615334297094122e-06, "loss": 1.3423, "step": 19293 }, { "epoch": 0.53, "learning_rate": 9.614450446040192e-06, "loss": 1.356, "step": 19294 }, { "epoch": 0.53, "learning_rate": 9.613566598002619e-06, "loss": 1.2629, "step": 19295 }, { "epoch": 0.53, "learning_rate": 9.61268275298832e-06, "loss": 1.2288, "step": 19296 }, { "epoch": 0.53, "learning_rate": 9.611798911004207e-06, "loss": 1.3733, "step": 19297 }, { "epoch": 0.53, "learning_rate": 9.6109150720572e-06, "loss": 1.271, "step": 19298 }, { "epoch": 0.53, "learning_rate": 9.610031236154206e-06, "loss": 1.3506, "step": 19299 }, { "epoch": 0.53, "learning_rate": 9.609147403302149e-06, "loss": 1.2256, "step": 19300 }, { "epoch": 0.53, "learning_rate": 9.608263573507936e-06, "loss": 1.3798, "step": 19301 }, { "epoch": 0.53, "learning_rate": 9.607379746778487e-06, "loss": 1.2454, "step": 19302 }, { "epoch": 0.53, "learning_rate": 9.606495923120712e-06, "loss": 1.3503, "step": 19303 }, { "epoch": 0.53, "learning_rate": 9.60561210254153e-06, "loss": 1.3057, "step": 19304 }, { "epoch": 0.53, "learning_rate": 9.60472828504785e-06, "loss": 1.22, "step": 19305 }, { "epoch": 0.53, "learning_rate": 9.603844470646594e-06, "loss": 1.1694, "step": 19306 }, { "epoch": 0.53, "learning_rate": 9.60296065934467e-06, "loss": 1.3701, "step": 19307 }, { "epoch": 0.53, "learning_rate": 9.602076851148992e-06, "loss": 1.6865, "step": 19308 }, { "epoch": 0.53, "learning_rate": 9.601193046066485e-06, "loss": 1.3354, "step": 19309 }, { "epoch": 0.53, "learning_rate": 9.60030924410405e-06, "loss": 1.2361, "step": 19310 }, { "epoch": 0.53, "learning_rate": 9.599425445268613e-06, "loss": 1.272, "step": 19311 }, { "epoch": 0.53, "learning_rate": 9.598541649567077e-06, "loss": 1.0608, "step": 19312 }, { "epoch": 0.53, "learning_rate": 9.597657857006368e-06, "loss": 1.2886, "step": 19313 }, { "epoch": 0.53, "learning_rate": 9.59677406759339e-06, "loss": 1.3569, "step": 19314 }, { "epoch": 0.53, "learning_rate": 9.595890281335066e-06, "loss": 1.2234, "step": 19315 }, { "epoch": 0.53, "learning_rate": 9.595006498238302e-06, "loss": 1.1489, "step": 19316 }, { "epoch": 0.53, "learning_rate": 9.594122718310023e-06, "loss": 1.2061, "step": 19317 }, { "epoch": 0.53, "learning_rate": 9.59323894155713e-06, "loss": 1.3733, "step": 19318 }, { "epoch": 0.53, "learning_rate": 9.59235516798655e-06, "loss": 1.3008, "step": 19319 }, { "epoch": 0.53, "learning_rate": 9.591471397605187e-06, "loss": 1.291, "step": 19320 }, { "epoch": 0.53, "learning_rate": 9.590587630419964e-06, "loss": 1.2893, "step": 19321 }, { "epoch": 0.53, "learning_rate": 9.589703866437787e-06, "loss": 1.3525, "step": 19322 }, { "epoch": 0.53, "learning_rate": 9.588820105665576e-06, "loss": 1.2764, "step": 19323 }, { "epoch": 0.53, "learning_rate": 9.587936348110242e-06, "loss": 1.3743, "step": 19324 }, { "epoch": 0.53, "learning_rate": 9.587052593778699e-06, "loss": 1.3513, "step": 19325 }, { "epoch": 0.53, "learning_rate": 9.586168842677865e-06, "loss": 1.3282, "step": 19326 }, { "epoch": 0.53, "learning_rate": 9.58528509481465e-06, "loss": 1.353, "step": 19327 }, { "epoch": 0.53, "learning_rate": 9.58440135019597e-06, "loss": 1.3318, "step": 19328 }, { "epoch": 0.53, "learning_rate": 9.583517608828738e-06, "loss": 1.3474, "step": 19329 }, { "epoch": 0.53, "learning_rate": 9.58263387071987e-06, "loss": 1.3218, "step": 19330 }, { "epoch": 0.53, "learning_rate": 9.581750135876277e-06, "loss": 1.304, "step": 19331 }, { "epoch": 0.53, "learning_rate": 9.580866404304876e-06, "loss": 1.3359, "step": 19332 }, { "epoch": 0.53, "learning_rate": 9.579982676012576e-06, "loss": 1.2791, "step": 19333 }, { "epoch": 0.53, "learning_rate": 9.579098951006296e-06, "loss": 1.7373, "step": 19334 }, { "epoch": 0.53, "learning_rate": 9.578215229292947e-06, "loss": 1.3523, "step": 19335 }, { "epoch": 0.53, "learning_rate": 9.577331510879445e-06, "loss": 1.2634, "step": 19336 }, { "epoch": 0.53, "learning_rate": 9.576447795772703e-06, "loss": 1.3096, "step": 19337 }, { "epoch": 0.53, "learning_rate": 9.575564083979632e-06, "loss": 1.0383, "step": 19338 }, { "epoch": 0.53, "learning_rate": 9.574680375507148e-06, "loss": 1.4409, "step": 19339 }, { "epoch": 0.53, "learning_rate": 9.573796670362165e-06, "loss": 1.168, "step": 19340 }, { "epoch": 0.53, "learning_rate": 9.572912968551598e-06, "loss": 1.2615, "step": 19341 }, { "epoch": 0.53, "learning_rate": 9.572029270082358e-06, "loss": 1.283, "step": 19342 }, { "epoch": 0.53, "learning_rate": 9.571145574961362e-06, "loss": 1.27, "step": 19343 }, { "epoch": 0.53, "learning_rate": 9.570261883195517e-06, "loss": 1.2363, "step": 19344 }, { "epoch": 0.53, "learning_rate": 9.569378194791745e-06, "loss": 1.3042, "step": 19345 }, { "epoch": 0.53, "learning_rate": 9.568494509756954e-06, "loss": 1.3472, "step": 19346 }, { "epoch": 0.53, "learning_rate": 9.56761082809806e-06, "loss": 1.2317, "step": 19347 }, { "epoch": 0.53, "learning_rate": 9.566727149821973e-06, "loss": 1.3147, "step": 19348 }, { "epoch": 0.53, "learning_rate": 9.56584347493561e-06, "loss": 1.2295, "step": 19349 }, { "epoch": 0.53, "learning_rate": 9.564959803445884e-06, "loss": 1.4624, "step": 19350 }, { "epoch": 0.53, "learning_rate": 9.56407613535971e-06, "loss": 1.79, "step": 19351 }, { "epoch": 0.53, "learning_rate": 9.563192470683996e-06, "loss": 1.293, "step": 19352 }, { "epoch": 0.53, "learning_rate": 9.56230880942566e-06, "loss": 1.2539, "step": 19353 }, { "epoch": 0.53, "learning_rate": 9.561425151591614e-06, "loss": 1.165, "step": 19354 }, { "epoch": 0.53, "learning_rate": 9.560541497188768e-06, "loss": 1.1837, "step": 19355 }, { "epoch": 0.53, "learning_rate": 9.559657846224046e-06, "loss": 1.397, "step": 19356 }, { "epoch": 0.53, "learning_rate": 9.558774198704347e-06, "loss": 1.2778, "step": 19357 }, { "epoch": 0.53, "learning_rate": 9.557890554636598e-06, "loss": 1.1555, "step": 19358 }, { "epoch": 0.53, "learning_rate": 9.557006914027698e-06, "loss": 1.3503, "step": 19359 }, { "epoch": 0.53, "learning_rate": 9.556123276884575e-06, "loss": 1.3828, "step": 19360 }, { "epoch": 0.53, "learning_rate": 9.555239643214128e-06, "loss": 1.3809, "step": 19361 }, { "epoch": 0.53, "learning_rate": 9.554356013023283e-06, "loss": 1.3635, "step": 19362 }, { "epoch": 0.53, "learning_rate": 9.55347238631894e-06, "loss": 1.2817, "step": 19363 }, { "epoch": 0.53, "learning_rate": 9.552588763108026e-06, "loss": 1.2488, "step": 19364 }, { "epoch": 0.53, "learning_rate": 9.551705143397442e-06, "loss": 1.2224, "step": 19365 }, { "epoch": 0.53, "learning_rate": 9.55082152719411e-06, "loss": 1.3933, "step": 19366 }, { "epoch": 0.53, "learning_rate": 9.549937914504935e-06, "loss": 1.2043, "step": 19367 }, { "epoch": 0.53, "learning_rate": 9.54905430533684e-06, "loss": 1.3577, "step": 19368 }, { "epoch": 0.53, "learning_rate": 9.548170699696725e-06, "loss": 1.3403, "step": 19369 }, { "epoch": 0.53, "learning_rate": 9.547287097591513e-06, "loss": 1.7075, "step": 19370 }, { "epoch": 0.53, "learning_rate": 9.546403499028115e-06, "loss": 1.364, "step": 19371 }, { "epoch": 0.53, "learning_rate": 9.545519904013442e-06, "loss": 1.0752, "step": 19372 }, { "epoch": 0.53, "learning_rate": 9.544636312554409e-06, "loss": 1.46, "step": 19373 }, { "epoch": 0.53, "learning_rate": 9.543752724657924e-06, "loss": 1.2942, "step": 19374 }, { "epoch": 0.53, "learning_rate": 9.542869140330908e-06, "loss": 1.4221, "step": 19375 }, { "epoch": 0.53, "learning_rate": 9.541985559580265e-06, "loss": 1.2028, "step": 19376 }, { "epoch": 0.53, "learning_rate": 9.541101982412912e-06, "loss": 1.1245, "step": 19377 }, { "epoch": 0.53, "learning_rate": 9.540218408835761e-06, "loss": 1.4922, "step": 19378 }, { "epoch": 0.53, "learning_rate": 9.539334838855728e-06, "loss": 1.2405, "step": 19379 }, { "epoch": 0.53, "learning_rate": 9.53845127247972e-06, "loss": 1.2609, "step": 19380 }, { "epoch": 0.53, "learning_rate": 9.537567709714654e-06, "loss": 1.3088, "step": 19381 }, { "epoch": 0.53, "learning_rate": 9.536684150567438e-06, "loss": 1.3875, "step": 19382 }, { "epoch": 0.53, "learning_rate": 9.53580059504499e-06, "loss": 1.2227, "step": 19383 }, { "epoch": 0.53, "learning_rate": 9.534917043154219e-06, "loss": 1.1709, "step": 19384 }, { "epoch": 0.53, "learning_rate": 9.534033494902038e-06, "loss": 1.2949, "step": 19385 }, { "epoch": 0.53, "learning_rate": 9.53314995029536e-06, "loss": 1.2551, "step": 19386 }, { "epoch": 0.53, "learning_rate": 9.532266409341095e-06, "loss": 1.3545, "step": 19387 }, { "epoch": 0.53, "learning_rate": 9.531382872046163e-06, "loss": 1.2185, "step": 19388 }, { "epoch": 0.53, "learning_rate": 9.530499338417466e-06, "loss": 1.2217, "step": 19389 }, { "epoch": 0.53, "learning_rate": 9.529615808461923e-06, "loss": 1.312, "step": 19390 }, { "epoch": 0.53, "learning_rate": 9.528732282186446e-06, "loss": 1.3264, "step": 19391 }, { "epoch": 0.53, "learning_rate": 9.527848759597946e-06, "loss": 1.3396, "step": 19392 }, { "epoch": 0.53, "learning_rate": 9.526965240703333e-06, "loss": 1.2209, "step": 19393 }, { "epoch": 0.53, "learning_rate": 9.526081725509523e-06, "loss": 1.3245, "step": 19394 }, { "epoch": 0.53, "learning_rate": 9.525198214023426e-06, "loss": 1.187, "step": 19395 }, { "epoch": 0.53, "learning_rate": 9.524314706251958e-06, "loss": 1.3806, "step": 19396 }, { "epoch": 0.53, "learning_rate": 9.523431202202024e-06, "loss": 1.3647, "step": 19397 }, { "epoch": 0.53, "learning_rate": 9.522547701880542e-06, "loss": 1.2908, "step": 19398 }, { "epoch": 0.53, "learning_rate": 9.521664205294422e-06, "loss": 1.5713, "step": 19399 }, { "epoch": 0.53, "learning_rate": 9.520780712450577e-06, "loss": 1.4631, "step": 19400 }, { "epoch": 0.53, "learning_rate": 9.519897223355917e-06, "loss": 1.1257, "step": 19401 }, { "epoch": 0.53, "learning_rate": 9.519013738017353e-06, "loss": 1.2856, "step": 19402 }, { "epoch": 0.53, "learning_rate": 9.518130256441805e-06, "loss": 1.3516, "step": 19403 }, { "epoch": 0.53, "learning_rate": 9.517246778636174e-06, "loss": 1.4551, "step": 19404 }, { "epoch": 0.53, "learning_rate": 9.516363304607383e-06, "loss": 1.2012, "step": 19405 }, { "epoch": 0.53, "learning_rate": 9.515479834362332e-06, "loss": 1.2793, "step": 19406 }, { "epoch": 0.53, "learning_rate": 9.514596367907945e-06, "loss": 1.2383, "step": 19407 }, { "epoch": 0.53, "learning_rate": 9.513712905251122e-06, "loss": 1.3381, "step": 19408 }, { "epoch": 0.53, "learning_rate": 9.512829446398787e-06, "loss": 1.3384, "step": 19409 }, { "epoch": 0.53, "learning_rate": 9.511945991357838e-06, "loss": 1.3711, "step": 19410 }, { "epoch": 0.53, "learning_rate": 9.511062540135201e-06, "loss": 1.3398, "step": 19411 }, { "epoch": 0.53, "learning_rate": 9.510179092737775e-06, "loss": 1.6987, "step": 19412 }, { "epoch": 0.53, "learning_rate": 9.509295649172483e-06, "loss": 1.2263, "step": 19413 }, { "epoch": 0.53, "learning_rate": 9.508412209446225e-06, "loss": 1.3877, "step": 19414 }, { "epoch": 0.53, "learning_rate": 9.507528773565924e-06, "loss": 1.2468, "step": 19415 }, { "epoch": 0.53, "learning_rate": 9.506645341538482e-06, "loss": 1.3928, "step": 19416 }, { "epoch": 0.53, "learning_rate": 9.505761913370814e-06, "loss": 1.3577, "step": 19417 }, { "epoch": 0.53, "learning_rate": 9.504878489069838e-06, "loss": 1.0943, "step": 19418 }, { "epoch": 0.53, "learning_rate": 9.503995068642456e-06, "loss": 1.324, "step": 19419 }, { "epoch": 0.53, "learning_rate": 9.503111652095584e-06, "loss": 1.2295, "step": 19420 }, { "epoch": 0.53, "learning_rate": 9.502228239436133e-06, "loss": 1.3259, "step": 19421 }, { "epoch": 0.53, "learning_rate": 9.501344830671015e-06, "loss": 1.2886, "step": 19422 }, { "epoch": 0.53, "learning_rate": 9.500461425807139e-06, "loss": 1.2449, "step": 19423 }, { "epoch": 0.53, "learning_rate": 9.499578024851421e-06, "loss": 1.2031, "step": 19424 }, { "epoch": 0.53, "learning_rate": 9.498694627810766e-06, "loss": 1.2322, "step": 19425 }, { "epoch": 0.53, "learning_rate": 9.49781123469209e-06, "loss": 1.3879, "step": 19426 }, { "epoch": 0.53, "learning_rate": 9.496927845502302e-06, "loss": 1.2795, "step": 19427 }, { "epoch": 0.53, "learning_rate": 9.496044460248315e-06, "loss": 1.3225, "step": 19428 }, { "epoch": 0.53, "learning_rate": 9.495161078937037e-06, "loss": 1.3945, "step": 19429 }, { "epoch": 0.53, "learning_rate": 9.494277701575385e-06, "loss": 1.3418, "step": 19430 }, { "epoch": 0.53, "learning_rate": 9.493394328170264e-06, "loss": 1.2756, "step": 19431 }, { "epoch": 0.53, "learning_rate": 9.492510958728585e-06, "loss": 1.4121, "step": 19432 }, { "epoch": 0.53, "learning_rate": 9.491627593257266e-06, "loss": 1.2727, "step": 19433 }, { "epoch": 0.53, "learning_rate": 9.490744231763211e-06, "loss": 1.3135, "step": 19434 }, { "epoch": 0.53, "learning_rate": 9.489860874253336e-06, "loss": 1.2742, "step": 19435 }, { "epoch": 0.53, "learning_rate": 9.488977520734549e-06, "loss": 1.2461, "step": 19436 }, { "epoch": 0.53, "learning_rate": 9.488094171213761e-06, "loss": 1.1169, "step": 19437 }, { "epoch": 0.53, "learning_rate": 9.487210825697882e-06, "loss": 1.4253, "step": 19438 }, { "epoch": 0.53, "learning_rate": 9.486327484193828e-06, "loss": 1.2798, "step": 19439 }, { "epoch": 0.53, "learning_rate": 9.485444146708503e-06, "loss": 1.3354, "step": 19440 }, { "epoch": 0.53, "learning_rate": 9.484560813248823e-06, "loss": 1.3445, "step": 19441 }, { "epoch": 0.53, "learning_rate": 9.483677483821695e-06, "loss": 1.3315, "step": 19442 }, { "epoch": 0.53, "learning_rate": 9.482794158434034e-06, "loss": 1.2517, "step": 19443 }, { "epoch": 0.53, "learning_rate": 9.481910837092745e-06, "loss": 1.7383, "step": 19444 }, { "epoch": 0.53, "learning_rate": 9.481027519804745e-06, "loss": 1.3057, "step": 19445 }, { "epoch": 0.53, "learning_rate": 9.48014420657694e-06, "loss": 1.4626, "step": 19446 }, { "epoch": 0.53, "learning_rate": 9.479260897416244e-06, "loss": 1.1526, "step": 19447 }, { "epoch": 0.53, "learning_rate": 9.478377592329563e-06, "loss": 1.3035, "step": 19448 }, { "epoch": 0.53, "learning_rate": 9.477494291323808e-06, "loss": 1.3706, "step": 19449 }, { "epoch": 0.53, "learning_rate": 9.4766109944059e-06, "loss": 1.4111, "step": 19450 }, { "epoch": 0.53, "learning_rate": 9.475727701582733e-06, "loss": 1.3821, "step": 19451 }, { "epoch": 0.53, "learning_rate": 9.474844412861234e-06, "loss": 1.1746, "step": 19452 }, { "epoch": 0.53, "learning_rate": 9.473961128248299e-06, "loss": 1.3457, "step": 19453 }, { "epoch": 0.53, "learning_rate": 9.473077847750851e-06, "loss": 1.1599, "step": 19454 }, { "epoch": 0.53, "learning_rate": 9.472194571375787e-06, "loss": 1.2039, "step": 19455 }, { "epoch": 0.53, "learning_rate": 9.471311299130031e-06, "loss": 1.2766, "step": 19456 }, { "epoch": 0.53, "learning_rate": 9.470428031020483e-06, "loss": 1.2104, "step": 19457 }, { "epoch": 0.53, "learning_rate": 9.46954476705406e-06, "loss": 1.3108, "step": 19458 }, { "epoch": 0.53, "learning_rate": 9.468661507237664e-06, "loss": 1.2871, "step": 19459 }, { "epoch": 0.53, "learning_rate": 9.467778251578217e-06, "loss": 1.1841, "step": 19460 }, { "epoch": 0.53, "learning_rate": 9.466895000082617e-06, "loss": 1.3169, "step": 19461 }, { "epoch": 0.53, "learning_rate": 9.466011752757786e-06, "loss": 1.2908, "step": 19462 }, { "epoch": 0.53, "learning_rate": 9.46512850961062e-06, "loss": 1.3796, "step": 19463 }, { "epoch": 0.53, "learning_rate": 9.46424527064804e-06, "loss": 1.3792, "step": 19464 }, { "epoch": 0.53, "learning_rate": 9.463362035876956e-06, "loss": 1.1499, "step": 19465 }, { "epoch": 0.53, "learning_rate": 9.462478805304273e-06, "loss": 1.2676, "step": 19466 }, { "epoch": 0.53, "learning_rate": 9.461595578936905e-06, "loss": 1.3306, "step": 19467 }, { "epoch": 0.53, "learning_rate": 9.460712356781757e-06, "loss": 1.1741, "step": 19468 }, { "epoch": 0.53, "learning_rate": 9.459829138845744e-06, "loss": 1.4973, "step": 19469 }, { "epoch": 0.53, "learning_rate": 9.458945925135773e-06, "loss": 1.2893, "step": 19470 }, { "epoch": 0.53, "learning_rate": 9.458062715658755e-06, "loss": 1.3982, "step": 19471 }, { "epoch": 0.53, "learning_rate": 9.457179510421599e-06, "loss": 1.2625, "step": 19472 }, { "epoch": 0.53, "learning_rate": 9.456296309431217e-06, "loss": 1.3572, "step": 19473 }, { "epoch": 0.53, "learning_rate": 9.455413112694515e-06, "loss": 1.1577, "step": 19474 }, { "epoch": 0.53, "learning_rate": 9.454529920218407e-06, "loss": 1.3474, "step": 19475 }, { "epoch": 0.53, "learning_rate": 9.453646732009796e-06, "loss": 1.269, "step": 19476 }, { "epoch": 0.53, "learning_rate": 9.4527635480756e-06, "loss": 1.3862, "step": 19477 }, { "epoch": 0.53, "learning_rate": 9.451880368422724e-06, "loss": 1.3225, "step": 19478 }, { "epoch": 0.53, "learning_rate": 9.450997193058075e-06, "loss": 1.1826, "step": 19479 }, { "epoch": 0.53, "learning_rate": 9.450114021988572e-06, "loss": 1.2595, "step": 19480 }, { "epoch": 0.53, "learning_rate": 9.449230855221113e-06, "loss": 1.3369, "step": 19481 }, { "epoch": 0.53, "learning_rate": 9.448347692762616e-06, "loss": 1.2935, "step": 19482 }, { "epoch": 0.53, "learning_rate": 9.447464534619985e-06, "loss": 1.4392, "step": 19483 }, { "epoch": 0.53, "learning_rate": 9.446581380800135e-06, "loss": 1.2302, "step": 19484 }, { "epoch": 0.53, "learning_rate": 9.445698231309968e-06, "loss": 1.7324, "step": 19485 }, { "epoch": 0.53, "learning_rate": 9.4448150861564e-06, "loss": 1.2139, "step": 19486 }, { "epoch": 0.53, "learning_rate": 9.443931945346334e-06, "loss": 1.2761, "step": 19487 }, { "epoch": 0.53, "learning_rate": 9.443048808886689e-06, "loss": 1.1663, "step": 19488 }, { "epoch": 0.53, "learning_rate": 9.442165676784363e-06, "loss": 1.3054, "step": 19489 }, { "epoch": 0.53, "learning_rate": 9.441282549046273e-06, "loss": 1.2974, "step": 19490 }, { "epoch": 0.53, "learning_rate": 9.440399425679324e-06, "loss": 1.3323, "step": 19491 }, { "epoch": 0.53, "learning_rate": 9.439516306690429e-06, "loss": 1.2471, "step": 19492 }, { "epoch": 0.53, "learning_rate": 9.438633192086493e-06, "loss": 1.1721, "step": 19493 }, { "epoch": 0.53, "learning_rate": 9.437750081874424e-06, "loss": 1.2109, "step": 19494 }, { "epoch": 0.53, "learning_rate": 9.43686697606114e-06, "loss": 1.1638, "step": 19495 }, { "epoch": 0.53, "learning_rate": 9.435983874653539e-06, "loss": 1.335, "step": 19496 }, { "epoch": 0.53, "learning_rate": 9.43510077765854e-06, "loss": 1.2688, "step": 19497 }, { "epoch": 0.53, "learning_rate": 9.434217685083043e-06, "loss": 1.2209, "step": 19498 }, { "epoch": 0.53, "learning_rate": 9.433334596933965e-06, "loss": 1.1968, "step": 19499 }, { "epoch": 0.53, "learning_rate": 9.432451513218204e-06, "loss": 1.3916, "step": 19500 }, { "epoch": 0.53, "learning_rate": 9.431568433942682e-06, "loss": 1.2566, "step": 19501 }, { "epoch": 0.53, "learning_rate": 9.430685359114295e-06, "loss": 1.2756, "step": 19502 }, { "epoch": 0.53, "learning_rate": 9.429802288739963e-06, "loss": 1.3245, "step": 19503 }, { "epoch": 0.53, "learning_rate": 9.428919222826588e-06, "loss": 1.1995, "step": 19504 }, { "epoch": 0.53, "learning_rate": 9.428036161381083e-06, "loss": 1.28, "step": 19505 }, { "epoch": 0.53, "learning_rate": 9.42715310441035e-06, "loss": 1.3433, "step": 19506 }, { "epoch": 0.53, "learning_rate": 9.426270051921305e-06, "loss": 1.2559, "step": 19507 }, { "epoch": 0.53, "learning_rate": 9.42538700392085e-06, "loss": 1.3555, "step": 19508 }, { "epoch": 0.53, "learning_rate": 9.424503960415901e-06, "loss": 1.304, "step": 19509 }, { "epoch": 0.53, "learning_rate": 9.423620921413359e-06, "loss": 1.324, "step": 19510 }, { "epoch": 0.53, "learning_rate": 9.422737886920135e-06, "loss": 1.335, "step": 19511 }, { "epoch": 0.53, "learning_rate": 9.421854856943142e-06, "loss": 1.2626, "step": 19512 }, { "epoch": 0.53, "learning_rate": 9.420971831489282e-06, "loss": 1.1746, "step": 19513 }, { "epoch": 0.53, "learning_rate": 9.420088810565469e-06, "loss": 1.2488, "step": 19514 }, { "epoch": 0.53, "learning_rate": 9.419205794178605e-06, "loss": 1.1562, "step": 19515 }, { "epoch": 0.53, "learning_rate": 9.418322782335605e-06, "loss": 1.3127, "step": 19516 }, { "epoch": 0.53, "learning_rate": 9.41743977504337e-06, "loss": 1.3042, "step": 19517 }, { "epoch": 0.53, "learning_rate": 9.416556772308817e-06, "loss": 1.2913, "step": 19518 }, { "epoch": 0.53, "learning_rate": 9.415673774138847e-06, "loss": 1.2605, "step": 19519 }, { "epoch": 0.53, "learning_rate": 9.414790780540372e-06, "loss": 1.1855, "step": 19520 }, { "epoch": 0.53, "learning_rate": 9.413907791520296e-06, "loss": 1.0637, "step": 19521 }, { "epoch": 0.53, "learning_rate": 9.413024807085532e-06, "loss": 1.3738, "step": 19522 }, { "epoch": 0.53, "learning_rate": 9.412141827242986e-06, "loss": 1.563, "step": 19523 }, { "epoch": 0.53, "learning_rate": 9.411258851999565e-06, "loss": 1.3174, "step": 19524 }, { "epoch": 0.53, "learning_rate": 9.410375881362178e-06, "loss": 1.2278, "step": 19525 }, { "epoch": 0.53, "learning_rate": 9.409492915337732e-06, "loss": 1.3425, "step": 19526 }, { "epoch": 0.53, "learning_rate": 9.408609953933138e-06, "loss": 1.3005, "step": 19527 }, { "epoch": 0.53, "learning_rate": 9.4077269971553e-06, "loss": 1.4004, "step": 19528 }, { "epoch": 0.53, "learning_rate": 9.406844045011127e-06, "loss": 1.2388, "step": 19529 }, { "epoch": 0.53, "learning_rate": 9.405961097507527e-06, "loss": 1.2258, "step": 19530 }, { "epoch": 0.53, "learning_rate": 9.405078154651412e-06, "loss": 1.2698, "step": 19531 }, { "epoch": 0.53, "learning_rate": 9.404195216449681e-06, "loss": 1.282, "step": 19532 }, { "epoch": 0.53, "learning_rate": 9.40331228290925e-06, "loss": 1.312, "step": 19533 }, { "epoch": 0.53, "learning_rate": 9.40242935403702e-06, "loss": 1.8633, "step": 19534 }, { "epoch": 0.53, "learning_rate": 9.401546429839905e-06, "loss": 1.2156, "step": 19535 }, { "epoch": 0.53, "learning_rate": 9.400663510324803e-06, "loss": 1.2959, "step": 19536 }, { "epoch": 0.53, "learning_rate": 9.399780595498636e-06, "loss": 1.2478, "step": 19537 }, { "epoch": 0.53, "learning_rate": 9.398897685368297e-06, "loss": 1.334, "step": 19538 }, { "epoch": 0.53, "learning_rate": 9.398014779940706e-06, "loss": 1.301, "step": 19539 }, { "epoch": 0.53, "learning_rate": 9.397131879222759e-06, "loss": 1.2976, "step": 19540 }, { "epoch": 0.53, "learning_rate": 9.396248983221369e-06, "loss": 1.2876, "step": 19541 }, { "epoch": 0.53, "learning_rate": 9.395366091943445e-06, "loss": 1.2886, "step": 19542 }, { "epoch": 0.53, "learning_rate": 9.394483205395891e-06, "loss": 1.3804, "step": 19543 }, { "epoch": 0.53, "learning_rate": 9.393600323585618e-06, "loss": 1.3291, "step": 19544 }, { "epoch": 0.53, "learning_rate": 9.39271744651953e-06, "loss": 1.2288, "step": 19545 }, { "epoch": 0.53, "learning_rate": 9.391834574204535e-06, "loss": 1.4092, "step": 19546 }, { "epoch": 0.53, "learning_rate": 9.39095170664754e-06, "loss": 1.2405, "step": 19547 }, { "epoch": 0.53, "learning_rate": 9.390068843855451e-06, "loss": 1.3311, "step": 19548 }, { "epoch": 0.53, "learning_rate": 9.389185985835178e-06, "loss": 1.3528, "step": 19549 }, { "epoch": 0.53, "learning_rate": 9.388303132593627e-06, "loss": 1.1042, "step": 19550 }, { "epoch": 0.53, "learning_rate": 9.387420284137704e-06, "loss": 1.3567, "step": 19551 }, { "epoch": 0.53, "learning_rate": 9.386537440474319e-06, "loss": 1.4988, "step": 19552 }, { "epoch": 0.53, "learning_rate": 9.385654601610373e-06, "loss": 1.2393, "step": 19553 }, { "epoch": 0.53, "learning_rate": 9.384771767552779e-06, "loss": 1.4221, "step": 19554 }, { "epoch": 0.53, "learning_rate": 9.383888938308439e-06, "loss": 1.3142, "step": 19555 }, { "epoch": 0.53, "learning_rate": 9.383006113884264e-06, "loss": 1.3318, "step": 19556 }, { "epoch": 0.53, "learning_rate": 9.38212329428716e-06, "loss": 1.3083, "step": 19557 }, { "epoch": 0.53, "learning_rate": 9.38124047952403e-06, "loss": 1.1985, "step": 19558 }, { "epoch": 0.53, "learning_rate": 9.380357669601786e-06, "loss": 1.1565, "step": 19559 }, { "epoch": 0.53, "learning_rate": 9.37947486452733e-06, "loss": 1.2507, "step": 19560 }, { "epoch": 0.53, "learning_rate": 9.378592064307575e-06, "loss": 1.2446, "step": 19561 }, { "epoch": 0.53, "learning_rate": 9.377709268949418e-06, "loss": 1.2075, "step": 19562 }, { "epoch": 0.53, "learning_rate": 9.376826478459775e-06, "loss": 1.3064, "step": 19563 }, { "epoch": 0.53, "learning_rate": 9.375943692845546e-06, "loss": 1.1938, "step": 19564 }, { "epoch": 0.53, "learning_rate": 9.375060912113643e-06, "loss": 1.2419, "step": 19565 }, { "epoch": 0.53, "learning_rate": 9.374178136270968e-06, "loss": 1.2681, "step": 19566 }, { "epoch": 0.53, "learning_rate": 9.37329536532443e-06, "loss": 1.2258, "step": 19567 }, { "epoch": 0.53, "learning_rate": 9.372412599280931e-06, "loss": 1.2153, "step": 19568 }, { "epoch": 0.53, "learning_rate": 9.371529838147385e-06, "loss": 1.2056, "step": 19569 }, { "epoch": 0.53, "learning_rate": 9.37064708193069e-06, "loss": 1.2041, "step": 19570 }, { "epoch": 0.53, "learning_rate": 9.36976433063776e-06, "loss": 1.3113, "step": 19571 }, { "epoch": 0.53, "learning_rate": 9.368881584275496e-06, "loss": 1.2166, "step": 19572 }, { "epoch": 0.53, "learning_rate": 9.367998842850802e-06, "loss": 1.1936, "step": 19573 }, { "epoch": 0.53, "learning_rate": 9.367116106370593e-06, "loss": 1.2476, "step": 19574 }, { "epoch": 0.53, "learning_rate": 9.366233374841766e-06, "loss": 1.3784, "step": 19575 }, { "epoch": 0.53, "learning_rate": 9.365350648271237e-06, "loss": 1.3291, "step": 19576 }, { "epoch": 0.53, "learning_rate": 9.3644679266659e-06, "loss": 1.3616, "step": 19577 }, { "epoch": 0.53, "learning_rate": 9.363585210032673e-06, "loss": 1.4656, "step": 19578 }, { "epoch": 0.53, "learning_rate": 9.362702498378448e-06, "loss": 1.2358, "step": 19579 }, { "epoch": 0.53, "learning_rate": 9.361819791710148e-06, "loss": 1.3123, "step": 19580 }, { "epoch": 0.53, "learning_rate": 9.360937090034662e-06, "loss": 1.3838, "step": 19581 }, { "epoch": 0.53, "learning_rate": 9.36005439335891e-06, "loss": 1.2139, "step": 19582 }, { "epoch": 0.53, "learning_rate": 9.359171701689787e-06, "loss": 1.3362, "step": 19583 }, { "epoch": 0.53, "learning_rate": 9.358289015034208e-06, "loss": 1.1675, "step": 19584 }, { "epoch": 0.53, "learning_rate": 9.357406333399069e-06, "loss": 1.3445, "step": 19585 }, { "epoch": 0.53, "learning_rate": 9.356523656791286e-06, "loss": 1.3142, "step": 19586 }, { "epoch": 0.53, "learning_rate": 9.355640985217752e-06, "loss": 1.2659, "step": 19587 }, { "epoch": 0.53, "learning_rate": 9.354758318685381e-06, "loss": 1.3455, "step": 19588 }, { "epoch": 0.53, "learning_rate": 9.353875657201084e-06, "loss": 1.3008, "step": 19589 }, { "epoch": 0.53, "learning_rate": 9.352993000771755e-06, "loss": 1.1531, "step": 19590 }, { "epoch": 0.54, "learning_rate": 9.352110349404307e-06, "loss": 1.2712, "step": 19591 }, { "epoch": 0.54, "learning_rate": 9.35122770310564e-06, "loss": 1.1877, "step": 19592 }, { "epoch": 0.54, "learning_rate": 9.350345061882666e-06, "loss": 1.3418, "step": 19593 }, { "epoch": 0.54, "learning_rate": 9.349462425742283e-06, "loss": 1.2764, "step": 19594 }, { "epoch": 0.54, "learning_rate": 9.348579794691405e-06, "loss": 1.2517, "step": 19595 }, { "epoch": 0.54, "learning_rate": 9.347697168736927e-06, "loss": 1.2344, "step": 19596 }, { "epoch": 0.54, "learning_rate": 9.346814547885764e-06, "loss": 1.1235, "step": 19597 }, { "epoch": 0.54, "learning_rate": 9.345931932144815e-06, "loss": 1.2681, "step": 19598 }, { "epoch": 0.54, "learning_rate": 9.345049321520986e-06, "loss": 1.3267, "step": 19599 }, { "epoch": 0.54, "learning_rate": 9.344166716021185e-06, "loss": 1.2629, "step": 19600 }, { "epoch": 0.54, "learning_rate": 9.343284115652315e-06, "loss": 1.1411, "step": 19601 }, { "epoch": 0.54, "learning_rate": 9.34240152042128e-06, "loss": 1.2942, "step": 19602 }, { "epoch": 0.54, "learning_rate": 9.341518930334985e-06, "loss": 1.0604, "step": 19603 }, { "epoch": 0.54, "learning_rate": 9.340636345400339e-06, "loss": 1.3191, "step": 19604 }, { "epoch": 0.54, "learning_rate": 9.339753765624243e-06, "loss": 1.7251, "step": 19605 }, { "epoch": 0.54, "learning_rate": 9.338871191013604e-06, "loss": 1.2593, "step": 19606 }, { "epoch": 0.54, "learning_rate": 9.337988621575325e-06, "loss": 1.229, "step": 19607 }, { "epoch": 0.54, "learning_rate": 9.337106057316311e-06, "loss": 1.416, "step": 19608 }, { "epoch": 0.54, "learning_rate": 9.336223498243469e-06, "loss": 1.3074, "step": 19609 }, { "epoch": 0.54, "learning_rate": 9.335340944363702e-06, "loss": 1.332, "step": 19610 }, { "epoch": 0.54, "learning_rate": 9.334458395683915e-06, "loss": 1.3711, "step": 19611 }, { "epoch": 0.54, "learning_rate": 9.333575852211014e-06, "loss": 1.1641, "step": 19612 }, { "epoch": 0.54, "learning_rate": 9.332693313951898e-06, "loss": 1.2783, "step": 19613 }, { "epoch": 0.54, "learning_rate": 9.33181078091348e-06, "loss": 1.4727, "step": 19614 }, { "epoch": 0.54, "learning_rate": 9.330928253102658e-06, "loss": 1.2993, "step": 19615 }, { "epoch": 0.54, "learning_rate": 9.330045730526339e-06, "loss": 1.1853, "step": 19616 }, { "epoch": 0.54, "learning_rate": 9.329163213191426e-06, "loss": 1.2356, "step": 19617 }, { "epoch": 0.54, "learning_rate": 9.328280701104822e-06, "loss": 1.0936, "step": 19618 }, { "epoch": 0.54, "learning_rate": 9.327398194273442e-06, "loss": 1.373, "step": 19619 }, { "epoch": 0.54, "learning_rate": 9.326515692704175e-06, "loss": 1.1433, "step": 19620 }, { "epoch": 0.54, "learning_rate": 9.325633196403938e-06, "loss": 1.3931, "step": 19621 }, { "epoch": 0.54, "learning_rate": 9.324750705379624e-06, "loss": 1.2122, "step": 19622 }, { "epoch": 0.54, "learning_rate": 9.323868219638148e-06, "loss": 1.3398, "step": 19623 }, { "epoch": 0.54, "learning_rate": 9.322985739186406e-06, "loss": 1.3562, "step": 19624 }, { "epoch": 0.54, "learning_rate": 9.32210326403131e-06, "loss": 1.3435, "step": 19625 }, { "epoch": 0.54, "learning_rate": 9.321220794179751e-06, "loss": 1.2639, "step": 19626 }, { "epoch": 0.54, "learning_rate": 9.32033832963865e-06, "loss": 1.2207, "step": 19627 }, { "epoch": 0.54, "learning_rate": 9.319455870414895e-06, "loss": 1.2871, "step": 19628 }, { "epoch": 0.54, "learning_rate": 9.318573416515404e-06, "loss": 1.4463, "step": 19629 }, { "epoch": 0.54, "learning_rate": 9.317690967947068e-06, "loss": 1.3831, "step": 19630 }, { "epoch": 0.54, "learning_rate": 9.316808524716804e-06, "loss": 1.283, "step": 19631 }, { "epoch": 0.54, "learning_rate": 9.315926086831502e-06, "loss": 1.5093, "step": 19632 }, { "epoch": 0.54, "learning_rate": 9.315043654298078e-06, "loss": 1.2434, "step": 19633 }, { "epoch": 0.54, "learning_rate": 9.314161227123424e-06, "loss": 1.2405, "step": 19634 }, { "epoch": 0.54, "learning_rate": 9.313278805314453e-06, "loss": 1.3887, "step": 19635 }, { "epoch": 0.54, "learning_rate": 9.312396388878067e-06, "loss": 1.2729, "step": 19636 }, { "epoch": 0.54, "learning_rate": 9.311513977821168e-06, "loss": 1.3867, "step": 19637 }, { "epoch": 0.54, "learning_rate": 9.310631572150661e-06, "loss": 1.3313, "step": 19638 }, { "epoch": 0.54, "learning_rate": 9.309749171873445e-06, "loss": 1.4087, "step": 19639 }, { "epoch": 0.54, "learning_rate": 9.30886677699643e-06, "loss": 1.3464, "step": 19640 }, { "epoch": 0.54, "learning_rate": 9.307984387526514e-06, "loss": 1.2566, "step": 19641 }, { "epoch": 0.54, "learning_rate": 9.307102003470606e-06, "loss": 1.324, "step": 19642 }, { "epoch": 0.54, "learning_rate": 9.306219624835603e-06, "loss": 1.2971, "step": 19643 }, { "epoch": 0.54, "learning_rate": 9.305337251628413e-06, "loss": 1.4043, "step": 19644 }, { "epoch": 0.54, "learning_rate": 9.304454883855937e-06, "loss": 1.4614, "step": 19645 }, { "epoch": 0.54, "learning_rate": 9.30357252152508e-06, "loss": 1.2129, "step": 19646 }, { "epoch": 0.54, "learning_rate": 9.302690164642743e-06, "loss": 1.1892, "step": 19647 }, { "epoch": 0.54, "learning_rate": 9.301807813215832e-06, "loss": 1.207, "step": 19648 }, { "epoch": 0.54, "learning_rate": 9.300925467251246e-06, "loss": 1.4229, "step": 19649 }, { "epoch": 0.54, "learning_rate": 9.30004312675589e-06, "loss": 1.2837, "step": 19650 }, { "epoch": 0.54, "learning_rate": 9.29916079173667e-06, "loss": 1.3403, "step": 19651 }, { "epoch": 0.54, "learning_rate": 9.298278462200484e-06, "loss": 1.269, "step": 19652 }, { "epoch": 0.54, "learning_rate": 9.297396138154239e-06, "loss": 1.2002, "step": 19653 }, { "epoch": 0.54, "learning_rate": 9.296513819604835e-06, "loss": 1.2625, "step": 19654 }, { "epoch": 0.54, "learning_rate": 9.295631506559178e-06, "loss": 1.1399, "step": 19655 }, { "epoch": 0.54, "learning_rate": 9.294749199024167e-06, "loss": 1.1619, "step": 19656 }, { "epoch": 0.54, "learning_rate": 9.293866897006708e-06, "loss": 1.3267, "step": 19657 }, { "epoch": 0.54, "learning_rate": 9.292984600513702e-06, "loss": 1.3318, "step": 19658 }, { "epoch": 0.54, "learning_rate": 9.29210230955205e-06, "loss": 1.2349, "step": 19659 }, { "epoch": 0.54, "learning_rate": 9.291220024128658e-06, "loss": 1.2744, "step": 19660 }, { "epoch": 0.54, "learning_rate": 9.29033774425043e-06, "loss": 1.2698, "step": 19661 }, { "epoch": 0.54, "learning_rate": 9.289455469924262e-06, "loss": 1.2964, "step": 19662 }, { "epoch": 0.54, "learning_rate": 9.288573201157063e-06, "loss": 1.1323, "step": 19663 }, { "epoch": 0.54, "learning_rate": 9.28769093795573e-06, "loss": 1.3203, "step": 19664 }, { "epoch": 0.54, "learning_rate": 9.286808680327166e-06, "loss": 1.1716, "step": 19665 }, { "epoch": 0.54, "learning_rate": 9.285926428278284e-06, "loss": 1.3425, "step": 19666 }, { "epoch": 0.54, "learning_rate": 9.285044181815968e-06, "loss": 1.1643, "step": 19667 }, { "epoch": 0.54, "learning_rate": 9.284161940947139e-06, "loss": 1.2571, "step": 19668 }, { "epoch": 0.54, "learning_rate": 9.283279705678684e-06, "loss": 1.1865, "step": 19669 }, { "epoch": 0.54, "learning_rate": 9.282397476017517e-06, "loss": 1.2507, "step": 19670 }, { "epoch": 0.54, "learning_rate": 9.281515251970528e-06, "loss": 1.2983, "step": 19671 }, { "epoch": 0.54, "learning_rate": 9.280633033544633e-06, "loss": 1.2795, "step": 19672 }, { "epoch": 0.54, "learning_rate": 9.27975082074672e-06, "loss": 1.4253, "step": 19673 }, { "epoch": 0.54, "learning_rate": 9.278868613583705e-06, "loss": 1.282, "step": 19674 }, { "epoch": 0.54, "learning_rate": 9.277986412062476e-06, "loss": 1.2964, "step": 19675 }, { "epoch": 0.54, "learning_rate": 9.277104216189948e-06, "loss": 1.2676, "step": 19676 }, { "epoch": 0.54, "learning_rate": 9.27622202597301e-06, "loss": 1.282, "step": 19677 }, { "epoch": 0.54, "learning_rate": 9.275339841418578e-06, "loss": 1.3445, "step": 19678 }, { "epoch": 0.54, "learning_rate": 9.27445766253354e-06, "loss": 1.3923, "step": 19679 }, { "epoch": 0.54, "learning_rate": 9.273575489324808e-06, "loss": 1.3584, "step": 19680 }, { "epoch": 0.54, "learning_rate": 9.272693321799275e-06, "loss": 1.2197, "step": 19681 }, { "epoch": 0.54, "learning_rate": 9.271811159963851e-06, "loss": 1.343, "step": 19682 }, { "epoch": 0.54, "learning_rate": 9.270929003825434e-06, "loss": 1.4597, "step": 19683 }, { "epoch": 0.54, "learning_rate": 9.270046853390924e-06, "loss": 1.6802, "step": 19684 }, { "epoch": 0.54, "learning_rate": 9.269164708667228e-06, "loss": 1.2893, "step": 19685 }, { "epoch": 0.54, "learning_rate": 9.26828256966124e-06, "loss": 1.3564, "step": 19686 }, { "epoch": 0.54, "learning_rate": 9.267400436379867e-06, "loss": 1.2332, "step": 19687 }, { "epoch": 0.54, "learning_rate": 9.266518308830008e-06, "loss": 1.4456, "step": 19688 }, { "epoch": 0.54, "learning_rate": 9.265636187018564e-06, "loss": 1.21, "step": 19689 }, { "epoch": 0.54, "learning_rate": 9.264754070952437e-06, "loss": 1.3086, "step": 19690 }, { "epoch": 0.54, "learning_rate": 9.263871960638533e-06, "loss": 1.1868, "step": 19691 }, { "epoch": 0.54, "learning_rate": 9.262989856083742e-06, "loss": 1.4099, "step": 19692 }, { "epoch": 0.54, "learning_rate": 9.262107757294977e-06, "loss": 1.2834, "step": 19693 }, { "epoch": 0.54, "learning_rate": 9.26122566427913e-06, "loss": 1.3752, "step": 19694 }, { "epoch": 0.54, "learning_rate": 9.260343577043109e-06, "loss": 1.145, "step": 19695 }, { "epoch": 0.54, "learning_rate": 9.259461495593809e-06, "loss": 1.467, "step": 19696 }, { "epoch": 0.54, "learning_rate": 9.258579419938134e-06, "loss": 1.2263, "step": 19697 }, { "epoch": 0.54, "learning_rate": 9.257697350082989e-06, "loss": 1.3196, "step": 19698 }, { "epoch": 0.54, "learning_rate": 9.256815286035268e-06, "loss": 1.3276, "step": 19699 }, { "epoch": 0.54, "learning_rate": 9.255933227801875e-06, "loss": 1.1316, "step": 19700 }, { "epoch": 0.54, "learning_rate": 9.255051175389712e-06, "loss": 1.5405, "step": 19701 }, { "epoch": 0.54, "learning_rate": 9.254169128805677e-06, "loss": 1.2786, "step": 19702 }, { "epoch": 0.54, "learning_rate": 9.25328708805667e-06, "loss": 1.4214, "step": 19703 }, { "epoch": 0.54, "learning_rate": 9.252405053149598e-06, "loss": 1.3452, "step": 19704 }, { "epoch": 0.54, "learning_rate": 9.251523024091354e-06, "loss": 1.1638, "step": 19705 }, { "epoch": 0.54, "learning_rate": 9.250641000888846e-06, "loss": 1.1865, "step": 19706 }, { "epoch": 0.54, "learning_rate": 9.249758983548964e-06, "loss": 1.1182, "step": 19707 }, { "epoch": 0.54, "learning_rate": 9.24887697207862e-06, "loss": 1.29, "step": 19708 }, { "epoch": 0.54, "learning_rate": 9.247994966484707e-06, "loss": 1.2666, "step": 19709 }, { "epoch": 0.54, "learning_rate": 9.24711296677413e-06, "loss": 1.1926, "step": 19710 }, { "epoch": 0.54, "learning_rate": 9.246230972953785e-06, "loss": 1.6978, "step": 19711 }, { "epoch": 0.54, "learning_rate": 9.245348985030571e-06, "loss": 1.1384, "step": 19712 }, { "epoch": 0.54, "learning_rate": 9.2444670030114e-06, "loss": 1.2178, "step": 19713 }, { "epoch": 0.54, "learning_rate": 9.243585026903155e-06, "loss": 1.3606, "step": 19714 }, { "epoch": 0.54, "learning_rate": 9.242703056712754e-06, "loss": 1.3105, "step": 19715 }, { "epoch": 0.54, "learning_rate": 9.241821092447081e-06, "loss": 1.1189, "step": 19716 }, { "epoch": 0.54, "learning_rate": 9.240939134113049e-06, "loss": 1.4319, "step": 19717 }, { "epoch": 0.54, "learning_rate": 9.240057181717546e-06, "loss": 1.3198, "step": 19718 }, { "epoch": 0.54, "learning_rate": 9.239175235267485e-06, "loss": 1.1902, "step": 19719 }, { "epoch": 0.54, "learning_rate": 9.238293294769753e-06, "loss": 1.2751, "step": 19720 }, { "epoch": 0.54, "learning_rate": 9.237411360231263e-06, "loss": 1.0574, "step": 19721 }, { "epoch": 0.54, "learning_rate": 9.236529431658901e-06, "loss": 1.5698, "step": 19722 }, { "epoch": 0.54, "learning_rate": 9.23564750905958e-06, "loss": 1.407, "step": 19723 }, { "epoch": 0.54, "learning_rate": 9.234765592440186e-06, "loss": 1.271, "step": 19724 }, { "epoch": 0.54, "learning_rate": 9.233883681807634e-06, "loss": 1.2769, "step": 19725 }, { "epoch": 0.54, "learning_rate": 9.233001777168808e-06, "loss": 1.3062, "step": 19726 }, { "epoch": 0.54, "learning_rate": 9.232119878530619e-06, "loss": 1.2847, "step": 19727 }, { "epoch": 0.54, "learning_rate": 9.231237985899964e-06, "loss": 1.1815, "step": 19728 }, { "epoch": 0.54, "learning_rate": 9.23035609928374e-06, "loss": 1.2576, "step": 19729 }, { "epoch": 0.54, "learning_rate": 9.229474218688851e-06, "loss": 1.2893, "step": 19730 }, { "epoch": 0.54, "learning_rate": 9.22859234412219e-06, "loss": 1.3491, "step": 19731 }, { "epoch": 0.54, "learning_rate": 9.227710475590662e-06, "loss": 1.4294, "step": 19732 }, { "epoch": 0.54, "learning_rate": 9.226828613101163e-06, "loss": 1.3237, "step": 19733 }, { "epoch": 0.54, "learning_rate": 9.225946756660595e-06, "loss": 1.3232, "step": 19734 }, { "epoch": 0.54, "learning_rate": 9.225064906275852e-06, "loss": 1.262, "step": 19735 }, { "epoch": 0.54, "learning_rate": 9.22418306195384e-06, "loss": 1.3875, "step": 19736 }, { "epoch": 0.54, "learning_rate": 9.223301223701454e-06, "loss": 1.2773, "step": 19737 }, { "epoch": 0.54, "learning_rate": 9.222419391525595e-06, "loss": 1.1755, "step": 19738 }, { "epoch": 0.54, "learning_rate": 9.221537565433159e-06, "loss": 1.2534, "step": 19739 }, { "epoch": 0.54, "learning_rate": 9.220655745431049e-06, "loss": 1.2896, "step": 19740 }, { "epoch": 0.54, "learning_rate": 9.21977393152616e-06, "loss": 1.4089, "step": 19741 }, { "epoch": 0.54, "learning_rate": 9.218892123725393e-06, "loss": 1.2449, "step": 19742 }, { "epoch": 0.54, "learning_rate": 9.218010322035648e-06, "loss": 1.2468, "step": 19743 }, { "epoch": 0.54, "learning_rate": 9.21712852646382e-06, "loss": 1.2476, "step": 19744 }, { "epoch": 0.54, "learning_rate": 9.216246737016814e-06, "loss": 1.3293, "step": 19745 }, { "epoch": 0.54, "learning_rate": 9.215364953701522e-06, "loss": 1.3501, "step": 19746 }, { "epoch": 0.54, "learning_rate": 9.214483176524847e-06, "loss": 1.0498, "step": 19747 }, { "epoch": 0.54, "learning_rate": 9.213601405493686e-06, "loss": 1.3118, "step": 19748 }, { "epoch": 0.54, "learning_rate": 9.212719640614939e-06, "loss": 1.2805, "step": 19749 }, { "epoch": 0.54, "learning_rate": 9.211837881895502e-06, "loss": 1.2563, "step": 19750 }, { "epoch": 0.54, "learning_rate": 9.210956129342275e-06, "loss": 1.3442, "step": 19751 }, { "epoch": 0.54, "learning_rate": 9.210074382962155e-06, "loss": 1.4041, "step": 19752 }, { "epoch": 0.54, "learning_rate": 9.209192642762044e-06, "loss": 1.3843, "step": 19753 }, { "epoch": 0.54, "learning_rate": 9.208310908748837e-06, "loss": 1.2864, "step": 19754 }, { "epoch": 0.54, "learning_rate": 9.207429180929433e-06, "loss": 1.1489, "step": 19755 }, { "epoch": 0.54, "learning_rate": 9.20654745931073e-06, "loss": 1.2385, "step": 19756 }, { "epoch": 0.54, "learning_rate": 9.205665743899628e-06, "loss": 1.2676, "step": 19757 }, { "epoch": 0.54, "learning_rate": 9.204784034703021e-06, "loss": 1.2197, "step": 19758 }, { "epoch": 0.54, "learning_rate": 9.203902331727808e-06, "loss": 1.2327, "step": 19759 }, { "epoch": 0.54, "learning_rate": 9.203020634980896e-06, "loss": 1.3098, "step": 19760 }, { "epoch": 0.54, "learning_rate": 9.202138944469168e-06, "loss": 1.1401, "step": 19761 }, { "epoch": 0.54, "learning_rate": 9.201257260199538e-06, "loss": 1.0918, "step": 19762 }, { "epoch": 0.54, "learning_rate": 9.200375582178888e-06, "loss": 1.1488, "step": 19763 }, { "epoch": 0.54, "learning_rate": 9.19949391041413e-06, "loss": 1.5176, "step": 19764 }, { "epoch": 0.54, "learning_rate": 9.198612244912148e-06, "loss": 1.3569, "step": 19765 }, { "epoch": 0.54, "learning_rate": 9.197730585679853e-06, "loss": 1.2571, "step": 19766 }, { "epoch": 0.54, "learning_rate": 9.196848932724133e-06, "loss": 1.2747, "step": 19767 }, { "epoch": 0.54, "learning_rate": 9.195967286051892e-06, "loss": 1.7061, "step": 19768 }, { "epoch": 0.54, "learning_rate": 9.195085645670022e-06, "loss": 1.3867, "step": 19769 }, { "epoch": 0.54, "learning_rate": 9.194204011585427e-06, "loss": 1.3813, "step": 19770 }, { "epoch": 0.54, "learning_rate": 9.193322383804998e-06, "loss": 1.4009, "step": 19771 }, { "epoch": 0.54, "learning_rate": 9.192440762335637e-06, "loss": 1.2603, "step": 19772 }, { "epoch": 0.54, "learning_rate": 9.191559147184238e-06, "loss": 1.3528, "step": 19773 }, { "epoch": 0.54, "learning_rate": 9.1906775383577e-06, "loss": 1.0771, "step": 19774 }, { "epoch": 0.54, "learning_rate": 9.189795935862923e-06, "loss": 1.2751, "step": 19775 }, { "epoch": 0.54, "learning_rate": 9.1889143397068e-06, "loss": 1.2122, "step": 19776 }, { "epoch": 0.54, "learning_rate": 9.18803274989623e-06, "loss": 1.2253, "step": 19777 }, { "epoch": 0.54, "learning_rate": 9.187151166438108e-06, "loss": 1.1431, "step": 19778 }, { "epoch": 0.54, "learning_rate": 9.186269589339337e-06, "loss": 1.0977, "step": 19779 }, { "epoch": 0.54, "learning_rate": 9.185388018606807e-06, "loss": 1.2446, "step": 19780 }, { "epoch": 0.54, "learning_rate": 9.18450645424742e-06, "loss": 1.3318, "step": 19781 }, { "epoch": 0.54, "learning_rate": 9.183624896268069e-06, "loss": 1.3135, "step": 19782 }, { "epoch": 0.54, "learning_rate": 9.182743344675655e-06, "loss": 1.2034, "step": 19783 }, { "epoch": 0.54, "learning_rate": 9.181861799477073e-06, "loss": 1.2637, "step": 19784 }, { "epoch": 0.54, "learning_rate": 9.180980260679217e-06, "loss": 1.4324, "step": 19785 }, { "epoch": 0.54, "learning_rate": 9.180098728288987e-06, "loss": 1.1292, "step": 19786 }, { "epoch": 0.54, "learning_rate": 9.179217202313282e-06, "loss": 1.2627, "step": 19787 }, { "epoch": 0.54, "learning_rate": 9.178335682758992e-06, "loss": 1.4453, "step": 19788 }, { "epoch": 0.54, "learning_rate": 9.177454169633017e-06, "loss": 1.2949, "step": 19789 }, { "epoch": 0.54, "learning_rate": 9.176572662942257e-06, "loss": 1.2227, "step": 19790 }, { "epoch": 0.54, "learning_rate": 9.175691162693602e-06, "loss": 1.4026, "step": 19791 }, { "epoch": 0.54, "learning_rate": 9.174809668893957e-06, "loss": 1.2661, "step": 19792 }, { "epoch": 0.54, "learning_rate": 9.173928181550206e-06, "loss": 1.2788, "step": 19793 }, { "epoch": 0.54, "learning_rate": 9.173046700669258e-06, "loss": 1.2656, "step": 19794 }, { "epoch": 0.54, "learning_rate": 9.172165226258e-06, "loss": 1.3386, "step": 19795 }, { "epoch": 0.54, "learning_rate": 9.171283758323336e-06, "loss": 1.2859, "step": 19796 }, { "epoch": 0.54, "learning_rate": 9.170402296872154e-06, "loss": 1.4692, "step": 19797 }, { "epoch": 0.54, "learning_rate": 9.169520841911358e-06, "loss": 1.3064, "step": 19798 }, { "epoch": 0.54, "learning_rate": 9.168639393447836e-06, "loss": 1.5107, "step": 19799 }, { "epoch": 0.54, "learning_rate": 9.167757951488494e-06, "loss": 1.269, "step": 19800 }, { "epoch": 0.54, "learning_rate": 9.166876516040216e-06, "loss": 1.3, "step": 19801 }, { "epoch": 0.54, "learning_rate": 9.165995087109911e-06, "loss": 1.3696, "step": 19802 }, { "epoch": 0.54, "learning_rate": 9.165113664704462e-06, "loss": 1.2615, "step": 19803 }, { "epoch": 0.54, "learning_rate": 9.164232248830777e-06, "loss": 1.1848, "step": 19804 }, { "epoch": 0.54, "learning_rate": 9.16335083949574e-06, "loss": 1.1367, "step": 19805 }, { "epoch": 0.54, "learning_rate": 9.162469436706257e-06, "loss": 1.2561, "step": 19806 }, { "epoch": 0.54, "learning_rate": 9.161588040469218e-06, "loss": 1.198, "step": 19807 }, { "epoch": 0.54, "learning_rate": 9.160706650791519e-06, "loss": 1.363, "step": 19808 }, { "epoch": 0.54, "learning_rate": 9.159825267680058e-06, "loss": 1.2524, "step": 19809 }, { "epoch": 0.54, "learning_rate": 9.158943891141728e-06, "loss": 1.2678, "step": 19810 }, { "epoch": 0.54, "learning_rate": 9.158062521183427e-06, "loss": 1.3247, "step": 19811 }, { "epoch": 0.54, "learning_rate": 9.157181157812047e-06, "loss": 1.345, "step": 19812 }, { "epoch": 0.54, "learning_rate": 9.156299801034487e-06, "loss": 1.2617, "step": 19813 }, { "epoch": 0.54, "learning_rate": 9.15541845085764e-06, "loss": 1.3289, "step": 19814 }, { "epoch": 0.54, "learning_rate": 9.154537107288401e-06, "loss": 1.0964, "step": 19815 }, { "epoch": 0.54, "learning_rate": 9.153655770333667e-06, "loss": 1.3325, "step": 19816 }, { "epoch": 0.54, "learning_rate": 9.152774440000333e-06, "loss": 1.3472, "step": 19817 }, { "epoch": 0.54, "learning_rate": 9.151893116295291e-06, "loss": 1.2292, "step": 19818 }, { "epoch": 0.54, "learning_rate": 9.151011799225441e-06, "loss": 1.2749, "step": 19819 }, { "epoch": 0.54, "learning_rate": 9.150130488797673e-06, "loss": 1.3625, "step": 19820 }, { "epoch": 0.54, "learning_rate": 9.149249185018885e-06, "loss": 1.2803, "step": 19821 }, { "epoch": 0.54, "learning_rate": 9.148367887895975e-06, "loss": 1.261, "step": 19822 }, { "epoch": 0.54, "learning_rate": 9.14748659743583e-06, "loss": 1.0496, "step": 19823 }, { "epoch": 0.54, "learning_rate": 9.146605313645352e-06, "loss": 1.385, "step": 19824 }, { "epoch": 0.54, "learning_rate": 9.14572403653143e-06, "loss": 1.3721, "step": 19825 }, { "epoch": 0.54, "learning_rate": 9.144842766100963e-06, "loss": 1.23, "step": 19826 }, { "epoch": 0.54, "learning_rate": 9.143961502360842e-06, "loss": 1.0581, "step": 19827 }, { "epoch": 0.54, "learning_rate": 9.143080245317966e-06, "loss": 1.2883, "step": 19828 }, { "epoch": 0.54, "learning_rate": 9.142198994979227e-06, "loss": 1.2368, "step": 19829 }, { "epoch": 0.54, "learning_rate": 9.14131775135152e-06, "loss": 1.2402, "step": 19830 }, { "epoch": 0.54, "learning_rate": 9.140436514441737e-06, "loss": 1.2407, "step": 19831 }, { "epoch": 0.54, "learning_rate": 9.139555284256778e-06, "loss": 1.3323, "step": 19832 }, { "epoch": 0.54, "learning_rate": 9.13867406080353e-06, "loss": 1.364, "step": 19833 }, { "epoch": 0.54, "learning_rate": 9.137792844088893e-06, "loss": 1.4819, "step": 19834 }, { "epoch": 0.54, "learning_rate": 9.136911634119758e-06, "loss": 1.2175, "step": 19835 }, { "epoch": 0.54, "learning_rate": 9.136030430903018e-06, "loss": 1.3477, "step": 19836 }, { "epoch": 0.54, "learning_rate": 9.135149234445578e-06, "loss": 1.3511, "step": 19837 }, { "epoch": 0.54, "learning_rate": 9.134268044754315e-06, "loss": 1.3215, "step": 19838 }, { "epoch": 0.54, "learning_rate": 9.13338686183614e-06, "loss": 1.1301, "step": 19839 }, { "epoch": 0.54, "learning_rate": 9.13250568569793e-06, "loss": 1.3091, "step": 19840 }, { "epoch": 0.54, "learning_rate": 9.131624516346595e-06, "loss": 1.1731, "step": 19841 }, { "epoch": 0.54, "learning_rate": 9.130743353789016e-06, "loss": 1.2383, "step": 19842 }, { "epoch": 0.54, "learning_rate": 9.129862198032098e-06, "loss": 1.3677, "step": 19843 }, { "epoch": 0.54, "learning_rate": 9.128981049082722e-06, "loss": 1.4475, "step": 19844 }, { "epoch": 0.54, "learning_rate": 9.128099906947796e-06, "loss": 1.2878, "step": 19845 }, { "epoch": 0.54, "learning_rate": 9.1272187716342e-06, "loss": 1.2549, "step": 19846 }, { "epoch": 0.54, "learning_rate": 9.12633764314884e-06, "loss": 1.2996, "step": 19847 }, { "epoch": 0.54, "learning_rate": 9.125456521498596e-06, "loss": 1.2698, "step": 19848 }, { "epoch": 0.54, "learning_rate": 9.124575406690377e-06, "loss": 1.1294, "step": 19849 }, { "epoch": 0.54, "learning_rate": 9.12369429873106e-06, "loss": 1.2764, "step": 19850 }, { "epoch": 0.54, "learning_rate": 9.122813197627551e-06, "loss": 1.2109, "step": 19851 }, { "epoch": 0.54, "learning_rate": 9.12193210338674e-06, "loss": 1.3137, "step": 19852 }, { "epoch": 0.54, "learning_rate": 9.121051016015517e-06, "loss": 1.3613, "step": 19853 }, { "epoch": 0.54, "learning_rate": 9.12016993552078e-06, "loss": 1.3616, "step": 19854 }, { "epoch": 0.54, "learning_rate": 9.119288861909419e-06, "loss": 1.2651, "step": 19855 }, { "epoch": 0.54, "learning_rate": 9.118407795188329e-06, "loss": 1.3237, "step": 19856 }, { "epoch": 0.54, "learning_rate": 9.117526735364399e-06, "loss": 1.2649, "step": 19857 }, { "epoch": 0.54, "learning_rate": 9.116645682444527e-06, "loss": 1.325, "step": 19858 }, { "epoch": 0.54, "learning_rate": 9.115764636435603e-06, "loss": 1.2397, "step": 19859 }, { "epoch": 0.54, "learning_rate": 9.11488359734452e-06, "loss": 1.2927, "step": 19860 }, { "epoch": 0.54, "learning_rate": 9.114002565178172e-06, "loss": 1.3423, "step": 19861 }, { "epoch": 0.54, "learning_rate": 9.113121539943453e-06, "loss": 1.3411, "step": 19862 }, { "epoch": 0.54, "learning_rate": 9.112240521647251e-06, "loss": 1.3936, "step": 19863 }, { "epoch": 0.54, "learning_rate": 9.111359510296464e-06, "loss": 1.3875, "step": 19864 }, { "epoch": 0.54, "learning_rate": 9.110478505897982e-06, "loss": 1.2037, "step": 19865 }, { "epoch": 0.54, "learning_rate": 9.109597508458698e-06, "loss": 1.3206, "step": 19866 }, { "epoch": 0.54, "learning_rate": 9.108716517985503e-06, "loss": 1.24, "step": 19867 }, { "epoch": 0.54, "learning_rate": 9.107835534485291e-06, "loss": 1.4541, "step": 19868 }, { "epoch": 0.54, "learning_rate": 9.106954557964956e-06, "loss": 1.2134, "step": 19869 }, { "epoch": 0.54, "learning_rate": 9.106073588431387e-06, "loss": 1.2058, "step": 19870 }, { "epoch": 0.54, "learning_rate": 9.10519262589148e-06, "loss": 1.2356, "step": 19871 }, { "epoch": 0.54, "learning_rate": 9.104311670352122e-06, "loss": 1.2102, "step": 19872 }, { "epoch": 0.54, "learning_rate": 9.10343072182021e-06, "loss": 1.2354, "step": 19873 }, { "epoch": 0.54, "learning_rate": 9.102549780302635e-06, "loss": 1.1951, "step": 19874 }, { "epoch": 0.54, "learning_rate": 9.101668845806288e-06, "loss": 1.2554, "step": 19875 }, { "epoch": 0.54, "learning_rate": 9.100787918338062e-06, "loss": 1.2998, "step": 19876 }, { "epoch": 0.54, "learning_rate": 9.099906997904849e-06, "loss": 1.3652, "step": 19877 }, { "epoch": 0.54, "learning_rate": 9.099026084513537e-06, "loss": 1.1943, "step": 19878 }, { "epoch": 0.54, "learning_rate": 9.098145178171026e-06, "loss": 1.3127, "step": 19879 }, { "epoch": 0.54, "learning_rate": 9.097264278884199e-06, "loss": 1.2107, "step": 19880 }, { "epoch": 0.54, "learning_rate": 9.096383386659954e-06, "loss": 1.0918, "step": 19881 }, { "epoch": 0.54, "learning_rate": 9.095502501505179e-06, "loss": 1.2239, "step": 19882 }, { "epoch": 0.54, "learning_rate": 9.094621623426764e-06, "loss": 1.5044, "step": 19883 }, { "epoch": 0.54, "learning_rate": 9.093740752431612e-06, "loss": 1.3208, "step": 19884 }, { "epoch": 0.54, "learning_rate": 9.092859888526598e-06, "loss": 1.428, "step": 19885 }, { "epoch": 0.54, "learning_rate": 9.091979031718629e-06, "loss": 1.446, "step": 19886 }, { "epoch": 0.54, "learning_rate": 9.091098182014581e-06, "loss": 1.4482, "step": 19887 }, { "epoch": 0.54, "learning_rate": 9.090217339421362e-06, "loss": 1.21, "step": 19888 }, { "epoch": 0.54, "learning_rate": 9.089336503945848e-06, "loss": 1.3137, "step": 19889 }, { "epoch": 0.54, "learning_rate": 9.088455675594942e-06, "loss": 1.2336, "step": 19890 }, { "epoch": 0.54, "learning_rate": 9.087574854375527e-06, "loss": 1.4014, "step": 19891 }, { "epoch": 0.54, "learning_rate": 9.0866940402945e-06, "loss": 1.3049, "step": 19892 }, { "epoch": 0.54, "learning_rate": 9.085813233358745e-06, "loss": 1.2041, "step": 19893 }, { "epoch": 0.54, "learning_rate": 9.084932433575162e-06, "loss": 1.4182, "step": 19894 }, { "epoch": 0.54, "learning_rate": 9.084051640950633e-06, "loss": 1.2222, "step": 19895 }, { "epoch": 0.54, "learning_rate": 9.083170855492058e-06, "loss": 1.293, "step": 19896 }, { "epoch": 0.54, "learning_rate": 9.082290077206317e-06, "loss": 1.2734, "step": 19897 }, { "epoch": 0.54, "learning_rate": 9.081409306100311e-06, "loss": 1.2493, "step": 19898 }, { "epoch": 0.54, "learning_rate": 9.080528542180926e-06, "loss": 1.3103, "step": 19899 }, { "epoch": 0.54, "learning_rate": 9.079647785455052e-06, "loss": 1.2239, "step": 19900 }, { "epoch": 0.54, "learning_rate": 9.078767035929584e-06, "loss": 1.2732, "step": 19901 }, { "epoch": 0.54, "learning_rate": 9.077886293611408e-06, "loss": 1.2493, "step": 19902 }, { "epoch": 0.54, "learning_rate": 9.077005558507416e-06, "loss": 1.0891, "step": 19903 }, { "epoch": 0.54, "learning_rate": 9.076124830624498e-06, "loss": 1.1425, "step": 19904 }, { "epoch": 0.54, "learning_rate": 9.075244109969547e-06, "loss": 1.2517, "step": 19905 }, { "epoch": 0.54, "learning_rate": 9.074363396549448e-06, "loss": 1.3049, "step": 19906 }, { "epoch": 0.54, "learning_rate": 9.073482690371096e-06, "loss": 1.5173, "step": 19907 }, { "epoch": 0.54, "learning_rate": 9.07260199144138e-06, "loss": 1.7451, "step": 19908 }, { "epoch": 0.54, "learning_rate": 9.071721299767192e-06, "loss": 1.262, "step": 19909 }, { "epoch": 0.54, "learning_rate": 9.070840615355415e-06, "loss": 1.3286, "step": 19910 }, { "epoch": 0.54, "learning_rate": 9.069959938212948e-06, "loss": 1.2864, "step": 19911 }, { "epoch": 0.54, "learning_rate": 9.069079268346675e-06, "loss": 1.4377, "step": 19912 }, { "epoch": 0.54, "learning_rate": 9.068198605763488e-06, "loss": 1.0453, "step": 19913 }, { "epoch": 0.54, "learning_rate": 9.067317950470278e-06, "loss": 1.366, "step": 19914 }, { "epoch": 0.54, "learning_rate": 9.066437302473934e-06, "loss": 1.3132, "step": 19915 }, { "epoch": 0.54, "learning_rate": 9.065556661781346e-06, "loss": 1.342, "step": 19916 }, { "epoch": 0.54, "learning_rate": 9.064676028399401e-06, "loss": 1.2766, "step": 19917 }, { "epoch": 0.54, "learning_rate": 9.063795402334994e-06, "loss": 1.2832, "step": 19918 }, { "epoch": 0.54, "learning_rate": 9.062914783595008e-06, "loss": 1.396, "step": 19919 }, { "epoch": 0.54, "learning_rate": 9.062034172186342e-06, "loss": 1.2617, "step": 19920 }, { "epoch": 0.54, "learning_rate": 9.061153568115874e-06, "loss": 1.2725, "step": 19921 }, { "epoch": 0.54, "learning_rate": 9.060272971390501e-06, "loss": 1.2322, "step": 19922 }, { "epoch": 0.54, "learning_rate": 9.059392382017109e-06, "loss": 1.46, "step": 19923 }, { "epoch": 0.54, "learning_rate": 9.058511800002591e-06, "loss": 1.2412, "step": 19924 }, { "epoch": 0.54, "learning_rate": 9.057631225353833e-06, "loss": 1.2161, "step": 19925 }, { "epoch": 0.54, "learning_rate": 9.056750658077726e-06, "loss": 1.3457, "step": 19926 }, { "epoch": 0.54, "learning_rate": 9.055870098181155e-06, "loss": 1.2424, "step": 19927 }, { "epoch": 0.54, "learning_rate": 9.054989545671017e-06, "loss": 1.3406, "step": 19928 }, { "epoch": 0.54, "learning_rate": 9.054109000554192e-06, "loss": 1.1318, "step": 19929 }, { "epoch": 0.54, "learning_rate": 9.053228462837573e-06, "loss": 1.0989, "step": 19930 }, { "epoch": 0.54, "learning_rate": 9.052347932528055e-06, "loss": 1.2878, "step": 19931 }, { "epoch": 0.54, "learning_rate": 9.051467409632515e-06, "loss": 1.3755, "step": 19932 }, { "epoch": 0.54, "learning_rate": 9.050586894157853e-06, "loss": 1.3433, "step": 19933 }, { "epoch": 0.54, "learning_rate": 9.049706386110949e-06, "loss": 1.4817, "step": 19934 }, { "epoch": 0.54, "learning_rate": 9.0488258854987e-06, "loss": 1.3203, "step": 19935 }, { "epoch": 0.54, "learning_rate": 9.047945392327982e-06, "loss": 1.3477, "step": 19936 }, { "epoch": 0.54, "learning_rate": 9.047064906605701e-06, "loss": 1.3442, "step": 19937 }, { "epoch": 0.54, "learning_rate": 9.046184428338728e-06, "loss": 1.2922, "step": 19938 }, { "epoch": 0.54, "learning_rate": 9.045303957533966e-06, "loss": 1.2625, "step": 19939 }, { "epoch": 0.54, "learning_rate": 9.04442349419829e-06, "loss": 1.2302, "step": 19940 }, { "epoch": 0.54, "learning_rate": 9.043543038338603e-06, "loss": 1.3645, "step": 19941 }, { "epoch": 0.54, "learning_rate": 9.04266258996178e-06, "loss": 1.3572, "step": 19942 }, { "epoch": 0.54, "learning_rate": 9.04178214907472e-06, "loss": 1.3276, "step": 19943 }, { "epoch": 0.54, "learning_rate": 9.040901715684298e-06, "loss": 1.2859, "step": 19944 }, { "epoch": 0.54, "learning_rate": 9.040021289797414e-06, "loss": 1.2783, "step": 19945 }, { "epoch": 0.54, "learning_rate": 9.039140871420953e-06, "loss": 1.198, "step": 19946 }, { "epoch": 0.54, "learning_rate": 9.0382604605618e-06, "loss": 1.2468, "step": 19947 }, { "epoch": 0.54, "learning_rate": 9.037380057226848e-06, "loss": 1.2935, "step": 19948 }, { "epoch": 0.54, "learning_rate": 9.036499661422978e-06, "loss": 1.3174, "step": 19949 }, { "epoch": 0.54, "learning_rate": 9.035619273157086e-06, "loss": 1.132, "step": 19950 }, { "epoch": 0.54, "learning_rate": 9.034738892436052e-06, "loss": 1.2366, "step": 19951 }, { "epoch": 0.54, "learning_rate": 9.033858519266769e-06, "loss": 1.2795, "step": 19952 }, { "epoch": 0.54, "learning_rate": 9.03297815365612e-06, "loss": 1.2715, "step": 19953 }, { "epoch": 0.54, "learning_rate": 9.032097795610998e-06, "loss": 1.231, "step": 19954 }, { "epoch": 0.54, "learning_rate": 9.031217445138285e-06, "loss": 1.3577, "step": 19955 }, { "epoch": 0.54, "learning_rate": 9.030337102244875e-06, "loss": 1.2771, "step": 19956 }, { "epoch": 0.55, "learning_rate": 9.029456766937646e-06, "loss": 1.2158, "step": 19957 }, { "epoch": 0.55, "learning_rate": 9.028576439223496e-06, "loss": 1.4375, "step": 19958 }, { "epoch": 0.55, "learning_rate": 9.027696119109305e-06, "loss": 1.3406, "step": 19959 }, { "epoch": 0.55, "learning_rate": 9.026815806601961e-06, "loss": 1.1648, "step": 19960 }, { "epoch": 0.55, "learning_rate": 9.025935501708355e-06, "loss": 1.2832, "step": 19961 }, { "epoch": 0.55, "learning_rate": 9.025055204435369e-06, "loss": 1.2397, "step": 19962 }, { "epoch": 0.55, "learning_rate": 9.024174914789896e-06, "loss": 1.3333, "step": 19963 }, { "epoch": 0.55, "learning_rate": 9.023294632778817e-06, "loss": 1.2437, "step": 19964 }, { "epoch": 0.55, "learning_rate": 9.022414358409024e-06, "loss": 1.3892, "step": 19965 }, { "epoch": 0.55, "learning_rate": 9.021534091687398e-06, "loss": 1.1899, "step": 19966 }, { "epoch": 0.55, "learning_rate": 9.020653832620832e-06, "loss": 1.3335, "step": 19967 }, { "epoch": 0.55, "learning_rate": 9.019773581216208e-06, "loss": 1.2683, "step": 19968 }, { "epoch": 0.55, "learning_rate": 9.018893337480417e-06, "loss": 1.2842, "step": 19969 }, { "epoch": 0.55, "learning_rate": 9.01801310142034e-06, "loss": 1.3604, "step": 19970 }, { "epoch": 0.55, "learning_rate": 9.017132873042869e-06, "loss": 1.2458, "step": 19971 }, { "epoch": 0.55, "learning_rate": 9.016252652354887e-06, "loss": 1.2478, "step": 19972 }, { "epoch": 0.55, "learning_rate": 9.015372439363283e-06, "loss": 1.4004, "step": 19973 }, { "epoch": 0.55, "learning_rate": 9.014492234074939e-06, "loss": 1.3357, "step": 19974 }, { "epoch": 0.55, "learning_rate": 9.013612036496745e-06, "loss": 1.3409, "step": 19975 }, { "epoch": 0.55, "learning_rate": 9.012731846635591e-06, "loss": 1.3225, "step": 19976 }, { "epoch": 0.55, "learning_rate": 9.011851664498352e-06, "loss": 1.2092, "step": 19977 }, { "epoch": 0.55, "learning_rate": 9.010971490091928e-06, "loss": 1.2517, "step": 19978 }, { "epoch": 0.55, "learning_rate": 9.010091323423192e-06, "loss": 1.325, "step": 19979 }, { "epoch": 0.55, "learning_rate": 9.009211164499042e-06, "loss": 1.2954, "step": 19980 }, { "epoch": 0.55, "learning_rate": 9.008331013326352e-06, "loss": 1.2483, "step": 19981 }, { "epoch": 0.55, "learning_rate": 9.00745086991202e-06, "loss": 1.4146, "step": 19982 }, { "epoch": 0.55, "learning_rate": 9.00657073426292e-06, "loss": 1.2893, "step": 19983 }, { "epoch": 0.55, "learning_rate": 9.005690606385949e-06, "loss": 1.2312, "step": 19984 }, { "epoch": 0.55, "learning_rate": 9.00481048628798e-06, "loss": 1.2765, "step": 19985 }, { "epoch": 0.55, "learning_rate": 9.003930373975913e-06, "loss": 1.2661, "step": 19986 }, { "epoch": 0.55, "learning_rate": 9.003050269456619e-06, "loss": 1.293, "step": 19987 }, { "epoch": 0.55, "learning_rate": 9.002170172736999e-06, "loss": 1.3594, "step": 19988 }, { "epoch": 0.55, "learning_rate": 9.001290083823923e-06, "loss": 1.1636, "step": 19989 }, { "epoch": 0.55, "learning_rate": 9.00041000272429e-06, "loss": 1.4673, "step": 19990 }, { "epoch": 0.55, "learning_rate": 8.999529929444972e-06, "loss": 1.2727, "step": 19991 }, { "epoch": 0.55, "learning_rate": 8.998649863992866e-06, "loss": 1.2644, "step": 19992 }, { "epoch": 0.55, "learning_rate": 8.997769806374851e-06, "loss": 1.4373, "step": 19993 }, { "epoch": 0.55, "learning_rate": 8.996889756597815e-06, "loss": 1.2644, "step": 19994 }, { "epoch": 0.55, "learning_rate": 8.996009714668643e-06, "loss": 1.1433, "step": 19995 }, { "epoch": 0.55, "learning_rate": 8.995129680594216e-06, "loss": 1.3655, "step": 19996 }, { "epoch": 0.55, "learning_rate": 8.994249654381426e-06, "loss": 1.2136, "step": 19997 }, { "epoch": 0.55, "learning_rate": 8.99336963603715e-06, "loss": 1.2693, "step": 19998 }, { "epoch": 0.55, "learning_rate": 8.992489625568278e-06, "loss": 1.7178, "step": 19999 }, { "epoch": 0.55, "learning_rate": 8.991609622981693e-06, "loss": 1.1841, "step": 20000 }, { "epoch": 0.55, "learning_rate": 8.99072962828428e-06, "loss": 1.2581, "step": 20001 }, { "epoch": 0.55, "learning_rate": 8.989849641482924e-06, "loss": 1.1777, "step": 20002 }, { "epoch": 0.55, "learning_rate": 8.98896966258451e-06, "loss": 1.301, "step": 20003 }, { "epoch": 0.55, "learning_rate": 8.988089691595921e-06, "loss": 1.3394, "step": 20004 }, { "epoch": 0.55, "learning_rate": 8.987209728524043e-06, "loss": 1.2781, "step": 20005 }, { "epoch": 0.55, "learning_rate": 8.98632977337576e-06, "loss": 1.3762, "step": 20006 }, { "epoch": 0.55, "learning_rate": 8.985449826157955e-06, "loss": 1.2192, "step": 20007 }, { "epoch": 0.55, "learning_rate": 8.984569886877515e-06, "loss": 1.4648, "step": 20008 }, { "epoch": 0.55, "learning_rate": 8.983689955541322e-06, "loss": 1.2085, "step": 20009 }, { "epoch": 0.55, "learning_rate": 8.982810032156261e-06, "loss": 1.3806, "step": 20010 }, { "epoch": 0.55, "learning_rate": 8.981930116729216e-06, "loss": 1.3374, "step": 20011 }, { "epoch": 0.55, "learning_rate": 8.981050209267072e-06, "loss": 1.3506, "step": 20012 }, { "epoch": 0.55, "learning_rate": 8.980170309776709e-06, "loss": 1.1606, "step": 20013 }, { "epoch": 0.55, "learning_rate": 8.979290418265018e-06, "loss": 1.2864, "step": 20014 }, { "epoch": 0.55, "learning_rate": 8.978410534738875e-06, "loss": 1.2881, "step": 20015 }, { "epoch": 0.55, "learning_rate": 8.97753065920517e-06, "loss": 1.2695, "step": 20016 }, { "epoch": 0.55, "learning_rate": 8.976650791670784e-06, "loss": 1.2222, "step": 20017 }, { "epoch": 0.55, "learning_rate": 8.975770932142602e-06, "loss": 1.2883, "step": 20018 }, { "epoch": 0.55, "learning_rate": 8.974891080627504e-06, "loss": 1.7974, "step": 20019 }, { "epoch": 0.55, "learning_rate": 8.974011237132379e-06, "loss": 1.3396, "step": 20020 }, { "epoch": 0.55, "learning_rate": 8.973131401664103e-06, "loss": 1.3052, "step": 20021 }, { "epoch": 0.55, "learning_rate": 8.972251574229564e-06, "loss": 1.3931, "step": 20022 }, { "epoch": 0.55, "learning_rate": 8.971371754835653e-06, "loss": 1.3662, "step": 20023 }, { "epoch": 0.55, "learning_rate": 8.970491943489238e-06, "loss": 1.2991, "step": 20024 }, { "epoch": 0.55, "learning_rate": 8.969612140197216e-06, "loss": 1.3303, "step": 20025 }, { "epoch": 0.55, "learning_rate": 8.968732344966458e-06, "loss": 1.2949, "step": 20026 }, { "epoch": 0.55, "learning_rate": 8.96785255780386e-06, "loss": 1.3826, "step": 20027 }, { "epoch": 0.55, "learning_rate": 8.96697277871629e-06, "loss": 1.324, "step": 20028 }, { "epoch": 0.55, "learning_rate": 8.966093007710647e-06, "loss": 1.2772, "step": 20029 }, { "epoch": 0.55, "learning_rate": 8.965213244793802e-06, "loss": 1.355, "step": 20030 }, { "epoch": 0.55, "learning_rate": 8.964333489972643e-06, "loss": 1.1914, "step": 20031 }, { "epoch": 0.55, "learning_rate": 8.963453743254052e-06, "loss": 1.4146, "step": 20032 }, { "epoch": 0.55, "learning_rate": 8.962574004644912e-06, "loss": 1.4424, "step": 20033 }, { "epoch": 0.55, "learning_rate": 8.961694274152103e-06, "loss": 1.3394, "step": 20034 }, { "epoch": 0.55, "learning_rate": 8.960814551782513e-06, "loss": 1.1741, "step": 20035 }, { "epoch": 0.55, "learning_rate": 8.959934837543017e-06, "loss": 1.2957, "step": 20036 }, { "epoch": 0.55, "learning_rate": 8.959055131440503e-06, "loss": 1.2776, "step": 20037 }, { "epoch": 0.55, "learning_rate": 8.958175433481855e-06, "loss": 1.3738, "step": 20038 }, { "epoch": 0.55, "learning_rate": 8.957295743673951e-06, "loss": 1.1804, "step": 20039 }, { "epoch": 0.55, "learning_rate": 8.956416062023676e-06, "loss": 1.1858, "step": 20040 }, { "epoch": 0.55, "learning_rate": 8.955536388537907e-06, "loss": 1.25, "step": 20041 }, { "epoch": 0.55, "learning_rate": 8.954656723223534e-06, "loss": 1.3923, "step": 20042 }, { "epoch": 0.55, "learning_rate": 8.953777066087434e-06, "loss": 1.2429, "step": 20043 }, { "epoch": 0.55, "learning_rate": 8.952897417136491e-06, "loss": 1.3098, "step": 20044 }, { "epoch": 0.55, "learning_rate": 8.952017776377584e-06, "loss": 1.3926, "step": 20045 }, { "epoch": 0.55, "learning_rate": 8.9511381438176e-06, "loss": 1.3486, "step": 20046 }, { "epoch": 0.55, "learning_rate": 8.950258519463416e-06, "loss": 1.2585, "step": 20047 }, { "epoch": 0.55, "learning_rate": 8.949378903321916e-06, "loss": 1.1677, "step": 20048 }, { "epoch": 0.55, "learning_rate": 8.948499295399982e-06, "loss": 1.3525, "step": 20049 }, { "epoch": 0.55, "learning_rate": 8.947619695704496e-06, "loss": 1.2888, "step": 20050 }, { "epoch": 0.55, "learning_rate": 8.946740104242337e-06, "loss": 1.2168, "step": 20051 }, { "epoch": 0.55, "learning_rate": 8.945860521020389e-06, "loss": 1.2939, "step": 20052 }, { "epoch": 0.55, "learning_rate": 8.944980946045532e-06, "loss": 1.2871, "step": 20053 }, { "epoch": 0.55, "learning_rate": 8.944101379324646e-06, "loss": 1.3308, "step": 20054 }, { "epoch": 0.55, "learning_rate": 8.943221820864618e-06, "loss": 1.2932, "step": 20055 }, { "epoch": 0.55, "learning_rate": 8.942342270672323e-06, "loss": 1.6758, "step": 20056 }, { "epoch": 0.55, "learning_rate": 8.941462728754647e-06, "loss": 1.302, "step": 20057 }, { "epoch": 0.55, "learning_rate": 8.940583195118467e-06, "loss": 1.3354, "step": 20058 }, { "epoch": 0.55, "learning_rate": 8.939703669770668e-06, "loss": 1.2393, "step": 20059 }, { "epoch": 0.55, "learning_rate": 8.938824152718125e-06, "loss": 1.2983, "step": 20060 }, { "epoch": 0.55, "learning_rate": 8.937944643967727e-06, "loss": 1.2283, "step": 20061 }, { "epoch": 0.55, "learning_rate": 8.937065143526349e-06, "loss": 1.2883, "step": 20062 }, { "epoch": 0.55, "learning_rate": 8.936185651400874e-06, "loss": 1.3079, "step": 20063 }, { "epoch": 0.55, "learning_rate": 8.935306167598178e-06, "loss": 1.3848, "step": 20064 }, { "epoch": 0.55, "learning_rate": 8.934426692125153e-06, "loss": 1.6797, "step": 20065 }, { "epoch": 0.55, "learning_rate": 8.933547224988666e-06, "loss": 1.2451, "step": 20066 }, { "epoch": 0.55, "learning_rate": 8.932667766195609e-06, "loss": 1.4575, "step": 20067 }, { "epoch": 0.55, "learning_rate": 8.931788315752853e-06, "loss": 1.4141, "step": 20068 }, { "epoch": 0.55, "learning_rate": 8.930908873667285e-06, "loss": 1.1819, "step": 20069 }, { "epoch": 0.55, "learning_rate": 8.930029439945784e-06, "loss": 1.4067, "step": 20070 }, { "epoch": 0.55, "learning_rate": 8.929150014595229e-06, "loss": 1.2756, "step": 20071 }, { "epoch": 0.55, "learning_rate": 8.928270597622502e-06, "loss": 1.2518, "step": 20072 }, { "epoch": 0.55, "learning_rate": 8.92739118903448e-06, "loss": 1.179, "step": 20073 }, { "epoch": 0.55, "learning_rate": 8.926511788838047e-06, "loss": 1.2535, "step": 20074 }, { "epoch": 0.55, "learning_rate": 8.925632397040078e-06, "loss": 1.3564, "step": 20075 }, { "epoch": 0.55, "learning_rate": 8.924753013647459e-06, "loss": 1.144, "step": 20076 }, { "epoch": 0.55, "learning_rate": 8.923873638667064e-06, "loss": 1.2566, "step": 20077 }, { "epoch": 0.55, "learning_rate": 8.922994272105778e-06, "loss": 1.624, "step": 20078 }, { "epoch": 0.55, "learning_rate": 8.922114913970477e-06, "loss": 1.6836, "step": 20079 }, { "epoch": 0.55, "learning_rate": 8.921235564268044e-06, "loss": 1.187, "step": 20080 }, { "epoch": 0.55, "learning_rate": 8.920356223005354e-06, "loss": 1.3291, "step": 20081 }, { "epoch": 0.55, "learning_rate": 8.919476890189292e-06, "loss": 1.1477, "step": 20082 }, { "epoch": 0.55, "learning_rate": 8.918597565826731e-06, "loss": 1.2019, "step": 20083 }, { "epoch": 0.55, "learning_rate": 8.917718249924556e-06, "loss": 1.3564, "step": 20084 }, { "epoch": 0.55, "learning_rate": 8.916838942489647e-06, "loss": 1.291, "step": 20085 }, { "epoch": 0.55, "learning_rate": 8.915959643528876e-06, "loss": 1.2556, "step": 20086 }, { "epoch": 0.55, "learning_rate": 8.915080353049132e-06, "loss": 1.3831, "step": 20087 }, { "epoch": 0.55, "learning_rate": 8.914201071057285e-06, "loss": 1.207, "step": 20088 }, { "epoch": 0.55, "learning_rate": 8.913321797560222e-06, "loss": 1.095, "step": 20089 }, { "epoch": 0.55, "learning_rate": 8.912442532564814e-06, "loss": 1.3679, "step": 20090 }, { "epoch": 0.55, "learning_rate": 8.911563276077948e-06, "loss": 1.333, "step": 20091 }, { "epoch": 0.55, "learning_rate": 8.910684028106497e-06, "loss": 1.2803, "step": 20092 }, { "epoch": 0.55, "learning_rate": 8.909804788657344e-06, "loss": 1.2898, "step": 20093 }, { "epoch": 0.55, "learning_rate": 8.908925557737362e-06, "loss": 1.2488, "step": 20094 }, { "epoch": 0.55, "learning_rate": 8.908046335353438e-06, "loss": 1.1895, "step": 20095 }, { "epoch": 0.55, "learning_rate": 8.907167121512441e-06, "loss": 1.4478, "step": 20096 }, { "epoch": 0.55, "learning_rate": 8.906287916221259e-06, "loss": 1.3457, "step": 20097 }, { "epoch": 0.55, "learning_rate": 8.905408719486763e-06, "loss": 1.3374, "step": 20098 }, { "epoch": 0.55, "learning_rate": 8.904529531315831e-06, "loss": 1.2673, "step": 20099 }, { "epoch": 0.55, "learning_rate": 8.903650351715353e-06, "loss": 1.3538, "step": 20100 }, { "epoch": 0.55, "learning_rate": 8.902771180692193e-06, "loss": 1.2209, "step": 20101 }, { "epoch": 0.55, "learning_rate": 8.901892018253242e-06, "loss": 1.3479, "step": 20102 }, { "epoch": 0.55, "learning_rate": 8.901012864405364e-06, "loss": 1.3083, "step": 20103 }, { "epoch": 0.55, "learning_rate": 8.900133719155451e-06, "loss": 1.2888, "step": 20104 }, { "epoch": 0.55, "learning_rate": 8.899254582510369e-06, "loss": 1.29, "step": 20105 }, { "epoch": 0.55, "learning_rate": 8.898375454477006e-06, "loss": 1.3174, "step": 20106 }, { "epoch": 0.55, "learning_rate": 8.89749633506223e-06, "loss": 1.2605, "step": 20107 }, { "epoch": 0.55, "learning_rate": 8.896617224272932e-06, "loss": 1.301, "step": 20108 }, { "epoch": 0.55, "learning_rate": 8.895738122115975e-06, "loss": 1.2461, "step": 20109 }, { "epoch": 0.55, "learning_rate": 8.89485902859825e-06, "loss": 1.8101, "step": 20110 }, { "epoch": 0.55, "learning_rate": 8.893979943726621e-06, "loss": 1.2483, "step": 20111 }, { "epoch": 0.55, "learning_rate": 8.89310086750798e-06, "loss": 1.1958, "step": 20112 }, { "epoch": 0.55, "learning_rate": 8.89222179994919e-06, "loss": 1.1128, "step": 20113 }, { "epoch": 0.55, "learning_rate": 8.891342741057142e-06, "loss": 1.178, "step": 20114 }, { "epoch": 0.55, "learning_rate": 8.890463690838702e-06, "loss": 1.3525, "step": 20115 }, { "epoch": 0.55, "learning_rate": 8.889584649300754e-06, "loss": 1.405, "step": 20116 }, { "epoch": 0.55, "learning_rate": 8.888705616450176e-06, "loss": 1.238, "step": 20117 }, { "epoch": 0.55, "learning_rate": 8.88782659229384e-06, "loss": 1.291, "step": 20118 }, { "epoch": 0.55, "learning_rate": 8.886947576838629e-06, "loss": 1.2615, "step": 20119 }, { "epoch": 0.55, "learning_rate": 8.886068570091412e-06, "loss": 1.4995, "step": 20120 }, { "epoch": 0.55, "learning_rate": 8.885189572059075e-06, "loss": 1.2695, "step": 20121 }, { "epoch": 0.55, "learning_rate": 8.88431058274849e-06, "loss": 1.3079, "step": 20122 }, { "epoch": 0.55, "learning_rate": 8.883431602166534e-06, "loss": 1.3857, "step": 20123 }, { "epoch": 0.55, "learning_rate": 8.882552630320082e-06, "loss": 1.7656, "step": 20124 }, { "epoch": 0.55, "learning_rate": 8.881673667216016e-06, "loss": 1.4458, "step": 20125 }, { "epoch": 0.55, "learning_rate": 8.880794712861206e-06, "loss": 1.1526, "step": 20126 }, { "epoch": 0.55, "learning_rate": 8.879915767262534e-06, "loss": 1.2573, "step": 20127 }, { "epoch": 0.55, "learning_rate": 8.879036830426872e-06, "loss": 1.3296, "step": 20128 }, { "epoch": 0.55, "learning_rate": 8.878157902361102e-06, "loss": 1.7412, "step": 20129 }, { "epoch": 0.55, "learning_rate": 8.877278983072095e-06, "loss": 1.2629, "step": 20130 }, { "epoch": 0.55, "learning_rate": 8.876400072566729e-06, "loss": 1.2949, "step": 20131 }, { "epoch": 0.55, "learning_rate": 8.875521170851883e-06, "loss": 1.2263, "step": 20132 }, { "epoch": 0.55, "learning_rate": 8.874642277934427e-06, "loss": 1.3733, "step": 20133 }, { "epoch": 0.55, "learning_rate": 8.873763393821243e-06, "loss": 1.2939, "step": 20134 }, { "epoch": 0.55, "learning_rate": 8.872884518519203e-06, "loss": 1.2412, "step": 20135 }, { "epoch": 0.55, "learning_rate": 8.872005652035188e-06, "loss": 1.3044, "step": 20136 }, { "epoch": 0.55, "learning_rate": 8.871126794376067e-06, "loss": 1.1365, "step": 20137 }, { "epoch": 0.55, "learning_rate": 8.87024794554872e-06, "loss": 1.3271, "step": 20138 }, { "epoch": 0.55, "learning_rate": 8.869369105560021e-06, "loss": 1.2749, "step": 20139 }, { "epoch": 0.55, "learning_rate": 8.86849027441685e-06, "loss": 1.3672, "step": 20140 }, { "epoch": 0.55, "learning_rate": 8.867611452126075e-06, "loss": 1.1631, "step": 20141 }, { "epoch": 0.55, "learning_rate": 8.866732638694579e-06, "loss": 1.3684, "step": 20142 }, { "epoch": 0.55, "learning_rate": 8.86585383412923e-06, "loss": 1.2642, "step": 20143 }, { "epoch": 0.55, "learning_rate": 8.86497503843691e-06, "loss": 1.2485, "step": 20144 }, { "epoch": 0.55, "learning_rate": 8.86409625162449e-06, "loss": 1.2256, "step": 20145 }, { "epoch": 0.55, "learning_rate": 8.863217473698844e-06, "loss": 1.3274, "step": 20146 }, { "epoch": 0.55, "learning_rate": 8.862338704666857e-06, "loss": 1.21, "step": 20147 }, { "epoch": 0.55, "learning_rate": 8.86145994453539e-06, "loss": 1.1836, "step": 20148 }, { "epoch": 0.55, "learning_rate": 8.860581193311332e-06, "loss": 1.2505, "step": 20149 }, { "epoch": 0.55, "learning_rate": 8.859702451001544e-06, "loss": 1.2595, "step": 20150 }, { "epoch": 0.55, "learning_rate": 8.858823717612915e-06, "loss": 1.2744, "step": 20151 }, { "epoch": 0.55, "learning_rate": 8.857944993152305e-06, "loss": 1.2363, "step": 20152 }, { "epoch": 0.55, "learning_rate": 8.857066277626604e-06, "loss": 1.3735, "step": 20153 }, { "epoch": 0.55, "learning_rate": 8.856187571042672e-06, "loss": 1.3059, "step": 20154 }, { "epoch": 0.55, "learning_rate": 8.855308873407398e-06, "loss": 1.3298, "step": 20155 }, { "epoch": 0.55, "learning_rate": 8.854430184727642e-06, "loss": 1.2185, "step": 20156 }, { "epoch": 0.55, "learning_rate": 8.853551505010291e-06, "loss": 1.4155, "step": 20157 }, { "epoch": 0.55, "learning_rate": 8.852672834262209e-06, "loss": 1.3555, "step": 20158 }, { "epoch": 0.55, "learning_rate": 8.85179417249028e-06, "loss": 1.28, "step": 20159 }, { "epoch": 0.55, "learning_rate": 8.850915519701369e-06, "loss": 1.2507, "step": 20160 }, { "epoch": 0.55, "learning_rate": 8.850036875902354e-06, "loss": 1.3555, "step": 20161 }, { "epoch": 0.55, "learning_rate": 8.849158241100114e-06, "loss": 1.2581, "step": 20162 }, { "epoch": 0.55, "learning_rate": 8.848279615301517e-06, "loss": 1.1348, "step": 20163 }, { "epoch": 0.55, "learning_rate": 8.84740099851344e-06, "loss": 1.1689, "step": 20164 }, { "epoch": 0.55, "learning_rate": 8.846522390742754e-06, "loss": 1.2852, "step": 20165 }, { "epoch": 0.55, "learning_rate": 8.845643791996336e-06, "loss": 1.2844, "step": 20166 }, { "epoch": 0.55, "learning_rate": 8.844765202281056e-06, "loss": 1.1355, "step": 20167 }, { "epoch": 0.55, "learning_rate": 8.843886621603792e-06, "loss": 1.1924, "step": 20168 }, { "epoch": 0.55, "learning_rate": 8.843008049971414e-06, "loss": 1.3245, "step": 20169 }, { "epoch": 0.55, "learning_rate": 8.842129487390798e-06, "loss": 1.4312, "step": 20170 }, { "epoch": 0.55, "learning_rate": 8.841250933868815e-06, "loss": 1.3835, "step": 20171 }, { "epoch": 0.55, "learning_rate": 8.840372389412341e-06, "loss": 1.2273, "step": 20172 }, { "epoch": 0.55, "learning_rate": 8.839493854028247e-06, "loss": 1.5081, "step": 20173 }, { "epoch": 0.55, "learning_rate": 8.838615327723408e-06, "loss": 1.498, "step": 20174 }, { "epoch": 0.55, "learning_rate": 8.837736810504697e-06, "loss": 1.1794, "step": 20175 }, { "epoch": 0.55, "learning_rate": 8.836858302378987e-06, "loss": 1.2888, "step": 20176 }, { "epoch": 0.55, "learning_rate": 8.835979803353148e-06, "loss": 1.1174, "step": 20177 }, { "epoch": 0.55, "learning_rate": 8.835101313434058e-06, "loss": 1.2678, "step": 20178 }, { "epoch": 0.55, "learning_rate": 8.834222832628587e-06, "loss": 1.2927, "step": 20179 }, { "epoch": 0.55, "learning_rate": 8.833344360943608e-06, "loss": 1.079, "step": 20180 }, { "epoch": 0.55, "learning_rate": 8.832465898385995e-06, "loss": 1.3115, "step": 20181 }, { "epoch": 0.55, "learning_rate": 8.831587444962619e-06, "loss": 1.2637, "step": 20182 }, { "epoch": 0.55, "learning_rate": 8.830709000680355e-06, "loss": 1.1833, "step": 20183 }, { "epoch": 0.55, "learning_rate": 8.829830565546072e-06, "loss": 1.3193, "step": 20184 }, { "epoch": 0.55, "learning_rate": 8.828952139566647e-06, "loss": 1.3965, "step": 20185 }, { "epoch": 0.55, "learning_rate": 8.828073722748947e-06, "loss": 1.1394, "step": 20186 }, { "epoch": 0.55, "learning_rate": 8.827195315099848e-06, "loss": 1.467, "step": 20187 }, { "epoch": 0.55, "learning_rate": 8.826316916626222e-06, "loss": 1.1819, "step": 20188 }, { "epoch": 0.55, "learning_rate": 8.825438527334941e-06, "loss": 1.1816, "step": 20189 }, { "epoch": 0.55, "learning_rate": 8.824560147232875e-06, "loss": 1.3379, "step": 20190 }, { "epoch": 0.55, "learning_rate": 8.823681776326899e-06, "loss": 1.2651, "step": 20191 }, { "epoch": 0.55, "learning_rate": 8.822803414623882e-06, "loss": 1.3916, "step": 20192 }, { "epoch": 0.55, "learning_rate": 8.821925062130694e-06, "loss": 1.2434, "step": 20193 }, { "epoch": 0.55, "learning_rate": 8.82104671885422e-06, "loss": 1.3203, "step": 20194 }, { "epoch": 0.55, "learning_rate": 8.820168384801313e-06, "loss": 1.3318, "step": 20195 }, { "epoch": 0.55, "learning_rate": 8.819290059978862e-06, "loss": 1.3777, "step": 20196 }, { "epoch": 0.55, "learning_rate": 8.818411744393722e-06, "loss": 1.3667, "step": 20197 }, { "epoch": 0.55, "learning_rate": 8.81753343805278e-06, "loss": 1.4065, "step": 20198 }, { "epoch": 0.55, "learning_rate": 8.816655140962894e-06, "loss": 1.3254, "step": 20199 }, { "epoch": 0.55, "learning_rate": 8.815776853130948e-06, "loss": 1.1897, "step": 20200 }, { "epoch": 0.55, "learning_rate": 8.814898574563802e-06, "loss": 1.1819, "step": 20201 }, { "epoch": 0.55, "learning_rate": 8.814020305268337e-06, "loss": 1.155, "step": 20202 }, { "epoch": 0.55, "learning_rate": 8.813142045251414e-06, "loss": 1.4094, "step": 20203 }, { "epoch": 0.55, "learning_rate": 8.812263794519916e-06, "loss": 1.2415, "step": 20204 }, { "epoch": 0.55, "learning_rate": 8.8113855530807e-06, "loss": 1.218, "step": 20205 }, { "epoch": 0.55, "learning_rate": 8.810507320940652e-06, "loss": 1.3481, "step": 20206 }, { "epoch": 0.55, "learning_rate": 8.80962909810663e-06, "loss": 1.3118, "step": 20207 }, { "epoch": 0.55, "learning_rate": 8.80875088458551e-06, "loss": 1.1877, "step": 20208 }, { "epoch": 0.55, "learning_rate": 8.807872680384166e-06, "loss": 1.2148, "step": 20209 }, { "epoch": 0.55, "learning_rate": 8.806994485509464e-06, "loss": 1.377, "step": 20210 }, { "epoch": 0.55, "learning_rate": 8.806116299968277e-06, "loss": 1.3167, "step": 20211 }, { "epoch": 0.55, "learning_rate": 8.805238123767474e-06, "loss": 1.1406, "step": 20212 }, { "epoch": 0.55, "learning_rate": 8.804359956913926e-06, "loss": 1.3821, "step": 20213 }, { "epoch": 0.55, "learning_rate": 8.803481799414504e-06, "loss": 1.342, "step": 20214 }, { "epoch": 0.55, "learning_rate": 8.802603651276079e-06, "loss": 1.3369, "step": 20215 }, { "epoch": 0.55, "learning_rate": 8.801725512505517e-06, "loss": 1.2302, "step": 20216 }, { "epoch": 0.55, "learning_rate": 8.800847383109694e-06, "loss": 1.311, "step": 20217 }, { "epoch": 0.55, "learning_rate": 8.799969263095475e-06, "loss": 1.4016, "step": 20218 }, { "epoch": 0.55, "learning_rate": 8.799091152469734e-06, "loss": 1.2441, "step": 20219 }, { "epoch": 0.55, "learning_rate": 8.798213051239338e-06, "loss": 1.2351, "step": 20220 }, { "epoch": 0.55, "learning_rate": 8.797334959411159e-06, "loss": 1.2812, "step": 20221 }, { "epoch": 0.55, "learning_rate": 8.796456876992063e-06, "loss": 1.3818, "step": 20222 }, { "epoch": 0.55, "learning_rate": 8.795578803988924e-06, "loss": 1.2224, "step": 20223 }, { "epoch": 0.55, "learning_rate": 8.794700740408612e-06, "loss": 1.4814, "step": 20224 }, { "epoch": 0.55, "learning_rate": 8.793822686257992e-06, "loss": 1.1061, "step": 20225 }, { "epoch": 0.55, "learning_rate": 8.792944641543937e-06, "loss": 1.3604, "step": 20226 }, { "epoch": 0.55, "learning_rate": 8.792066606273316e-06, "loss": 1.3313, "step": 20227 }, { "epoch": 0.55, "learning_rate": 8.791188580452999e-06, "loss": 1.3306, "step": 20228 }, { "epoch": 0.55, "learning_rate": 8.790310564089852e-06, "loss": 1.3408, "step": 20229 }, { "epoch": 0.55, "learning_rate": 8.789432557190746e-06, "loss": 1.3027, "step": 20230 }, { "epoch": 0.55, "learning_rate": 8.788554559762552e-06, "loss": 1.147, "step": 20231 }, { "epoch": 0.55, "learning_rate": 8.787676571812139e-06, "loss": 1.2092, "step": 20232 }, { "epoch": 0.55, "learning_rate": 8.78679859334637e-06, "loss": 1.6797, "step": 20233 }, { "epoch": 0.55, "learning_rate": 8.785920624372122e-06, "loss": 1.3931, "step": 20234 }, { "epoch": 0.55, "learning_rate": 8.785042664896257e-06, "loss": 1.342, "step": 20235 }, { "epoch": 0.55, "learning_rate": 8.78416471492565e-06, "loss": 1.7104, "step": 20236 }, { "epoch": 0.55, "learning_rate": 8.783286774467165e-06, "loss": 1.3149, "step": 20237 }, { "epoch": 0.55, "learning_rate": 8.782408843527674e-06, "loss": 1.3186, "step": 20238 }, { "epoch": 0.55, "learning_rate": 8.78153092211404e-06, "loss": 1.2593, "step": 20239 }, { "epoch": 0.55, "learning_rate": 8.780653010233134e-06, "loss": 1.2212, "step": 20240 }, { "epoch": 0.55, "learning_rate": 8.779775107891833e-06, "loss": 1.2805, "step": 20241 }, { "epoch": 0.55, "learning_rate": 8.778897215096988e-06, "loss": 1.3237, "step": 20242 }, { "epoch": 0.55, "learning_rate": 8.778019331855486e-06, "loss": 1.3372, "step": 20243 }, { "epoch": 0.55, "learning_rate": 8.77714145817418e-06, "loss": 1.4077, "step": 20244 }, { "epoch": 0.55, "learning_rate": 8.77626359405995e-06, "loss": 1.7349, "step": 20245 }, { "epoch": 0.55, "learning_rate": 8.775385739519651e-06, "loss": 1.2014, "step": 20246 }, { "epoch": 0.55, "learning_rate": 8.774507894560165e-06, "loss": 1.3928, "step": 20247 }, { "epoch": 0.55, "learning_rate": 8.773630059188347e-06, "loss": 1.2532, "step": 20248 }, { "epoch": 0.55, "learning_rate": 8.772752233411078e-06, "loss": 1.27, "step": 20249 }, { "epoch": 0.55, "learning_rate": 8.771874417235211e-06, "loss": 1.2461, "step": 20250 }, { "epoch": 0.55, "learning_rate": 8.770996610667628e-06, "loss": 1.2432, "step": 20251 }, { "epoch": 0.55, "learning_rate": 8.770118813715181e-06, "loss": 1.1968, "step": 20252 }, { "epoch": 0.55, "learning_rate": 8.769241026384756e-06, "loss": 1.3264, "step": 20253 }, { "epoch": 0.55, "learning_rate": 8.768363248683201e-06, "loss": 1.3743, "step": 20254 }, { "epoch": 0.55, "learning_rate": 8.767485480617397e-06, "loss": 1.0253, "step": 20255 }, { "epoch": 0.55, "learning_rate": 8.766607722194207e-06, "loss": 1.3396, "step": 20256 }, { "epoch": 0.55, "learning_rate": 8.765729973420498e-06, "loss": 1.2715, "step": 20257 }, { "epoch": 0.55, "learning_rate": 8.764852234303139e-06, "loss": 1.0471, "step": 20258 }, { "epoch": 0.55, "learning_rate": 8.763974504848992e-06, "loss": 1.3047, "step": 20259 }, { "epoch": 0.55, "learning_rate": 8.76309678506493e-06, "loss": 1.239, "step": 20260 }, { "epoch": 0.55, "learning_rate": 8.762219074957816e-06, "loss": 1.2241, "step": 20261 }, { "epoch": 0.55, "learning_rate": 8.761341374534519e-06, "loss": 1.3042, "step": 20262 }, { "epoch": 0.55, "learning_rate": 8.760463683801903e-06, "loss": 1.3169, "step": 20263 }, { "epoch": 0.55, "learning_rate": 8.759586002766838e-06, "loss": 1.376, "step": 20264 }, { "epoch": 0.55, "learning_rate": 8.758708331436188e-06, "loss": 1.2712, "step": 20265 }, { "epoch": 0.55, "learning_rate": 8.75783066981682e-06, "loss": 1.397, "step": 20266 }, { "epoch": 0.55, "learning_rate": 8.756953017915601e-06, "loss": 1.4514, "step": 20267 }, { "epoch": 0.55, "learning_rate": 8.756075375739398e-06, "loss": 1.098, "step": 20268 }, { "epoch": 0.55, "learning_rate": 8.755197743295075e-06, "loss": 1.1296, "step": 20269 }, { "epoch": 0.55, "learning_rate": 8.754320120589497e-06, "loss": 1.3936, "step": 20270 }, { "epoch": 0.55, "learning_rate": 8.753442507629539e-06, "loss": 1.24, "step": 20271 }, { "epoch": 0.55, "learning_rate": 8.752564904422055e-06, "loss": 1.1586, "step": 20272 }, { "epoch": 0.55, "learning_rate": 8.75168731097392e-06, "loss": 1.2712, "step": 20273 }, { "epoch": 0.55, "learning_rate": 8.750809727291995e-06, "loss": 1.7417, "step": 20274 }, { "epoch": 0.55, "learning_rate": 8.749932153383149e-06, "loss": 1.4084, "step": 20275 }, { "epoch": 0.55, "learning_rate": 8.749054589254243e-06, "loss": 1.3835, "step": 20276 }, { "epoch": 0.55, "learning_rate": 8.748177034912148e-06, "loss": 1.3005, "step": 20277 }, { "epoch": 0.55, "learning_rate": 8.747299490363725e-06, "loss": 1.0898, "step": 20278 }, { "epoch": 0.55, "learning_rate": 8.746421955615845e-06, "loss": 1.2188, "step": 20279 }, { "epoch": 0.55, "learning_rate": 8.745544430675367e-06, "loss": 1.3657, "step": 20280 }, { "epoch": 0.55, "learning_rate": 8.744666915549161e-06, "loss": 1.1611, "step": 20281 }, { "epoch": 0.55, "learning_rate": 8.74378941024409e-06, "loss": 1.3599, "step": 20282 }, { "epoch": 0.55, "learning_rate": 8.742911914767022e-06, "loss": 1.2666, "step": 20283 }, { "epoch": 0.55, "learning_rate": 8.742034429124818e-06, "loss": 1.217, "step": 20284 }, { "epoch": 0.55, "learning_rate": 8.741156953324342e-06, "loss": 1.0969, "step": 20285 }, { "epoch": 0.55, "learning_rate": 8.740279487372469e-06, "loss": 1.2019, "step": 20286 }, { "epoch": 0.55, "learning_rate": 8.73940203127605e-06, "loss": 1.0551, "step": 20287 }, { "epoch": 0.55, "learning_rate": 8.738524585041964e-06, "loss": 1.3176, "step": 20288 }, { "epoch": 0.55, "learning_rate": 8.737647148677062e-06, "loss": 1.3372, "step": 20289 }, { "epoch": 0.55, "learning_rate": 8.73676972218822e-06, "loss": 1.3413, "step": 20290 }, { "epoch": 0.55, "learning_rate": 8.735892305582293e-06, "loss": 1.3975, "step": 20291 }, { "epoch": 0.55, "learning_rate": 8.735014898866156e-06, "loss": 1.0999, "step": 20292 }, { "epoch": 0.55, "learning_rate": 8.734137502046661e-06, "loss": 1.3091, "step": 20293 }, { "epoch": 0.55, "learning_rate": 8.733260115130684e-06, "loss": 1.2527, "step": 20294 }, { "epoch": 0.55, "learning_rate": 8.732382738125082e-06, "loss": 1.1958, "step": 20295 }, { "epoch": 0.55, "learning_rate": 8.731505371036723e-06, "loss": 1.1753, "step": 20296 }, { "epoch": 0.55, "learning_rate": 8.730628013872466e-06, "loss": 1.304, "step": 20297 }, { "epoch": 0.55, "learning_rate": 8.729750666639182e-06, "loss": 1.3274, "step": 20298 }, { "epoch": 0.55, "learning_rate": 8.72887332934373e-06, "loss": 1.3779, "step": 20299 }, { "epoch": 0.55, "learning_rate": 8.727996001992976e-06, "loss": 1.1765, "step": 20300 }, { "epoch": 0.55, "learning_rate": 8.727118684593782e-06, "loss": 1.2249, "step": 20301 }, { "epoch": 0.55, "learning_rate": 8.726241377153012e-06, "loss": 1.1853, "step": 20302 }, { "epoch": 0.55, "learning_rate": 8.725364079677534e-06, "loss": 1.1313, "step": 20303 }, { "epoch": 0.55, "learning_rate": 8.724486792174205e-06, "loss": 1.3167, "step": 20304 }, { "epoch": 0.55, "learning_rate": 8.723609514649894e-06, "loss": 1.2524, "step": 20305 }, { "epoch": 0.55, "learning_rate": 8.72273224711146e-06, "loss": 1.1938, "step": 20306 }, { "epoch": 0.55, "learning_rate": 8.721854989565771e-06, "loss": 1.2451, "step": 20307 }, { "epoch": 0.55, "learning_rate": 8.720977742019683e-06, "loss": 1.2153, "step": 20308 }, { "epoch": 0.55, "learning_rate": 8.720100504480069e-06, "loss": 1.3523, "step": 20309 }, { "epoch": 0.55, "learning_rate": 8.719223276953782e-06, "loss": 1.7388, "step": 20310 }, { "epoch": 0.55, "learning_rate": 8.718346059447695e-06, "loss": 1.2683, "step": 20311 }, { "epoch": 0.55, "learning_rate": 8.71746885196866e-06, "loss": 1.2246, "step": 20312 }, { "epoch": 0.55, "learning_rate": 8.71659165452355e-06, "loss": 1.2739, "step": 20313 }, { "epoch": 0.55, "learning_rate": 8.715714467119221e-06, "loss": 1.2805, "step": 20314 }, { "epoch": 0.55, "learning_rate": 8.71483728976254e-06, "loss": 1.1726, "step": 20315 }, { "epoch": 0.55, "learning_rate": 8.713960122460365e-06, "loss": 1.2795, "step": 20316 }, { "epoch": 0.55, "learning_rate": 8.713082965219562e-06, "loss": 1.2522, "step": 20317 }, { "epoch": 0.55, "learning_rate": 8.712205818046995e-06, "loss": 1.3738, "step": 20318 }, { "epoch": 0.55, "learning_rate": 8.711328680949521e-06, "loss": 1.3535, "step": 20319 }, { "epoch": 0.55, "learning_rate": 8.710451553934008e-06, "loss": 1.1658, "step": 20320 }, { "epoch": 0.55, "learning_rate": 8.709574437007312e-06, "loss": 1.3167, "step": 20321 }, { "epoch": 0.55, "learning_rate": 8.708697330176304e-06, "loss": 1.3779, "step": 20322 }, { "epoch": 0.56, "learning_rate": 8.707820233447838e-06, "loss": 1.2588, "step": 20323 }, { "epoch": 0.56, "learning_rate": 8.70694314682878e-06, "loss": 1.4348, "step": 20324 }, { "epoch": 0.56, "learning_rate": 8.70606607032599e-06, "loss": 1.2061, "step": 20325 }, { "epoch": 0.56, "learning_rate": 8.70518900394633e-06, "loss": 1.2439, "step": 20326 }, { "epoch": 0.56, "learning_rate": 8.704311947696661e-06, "loss": 1.1772, "step": 20327 }, { "epoch": 0.56, "learning_rate": 8.703434901583851e-06, "loss": 1.1335, "step": 20328 }, { "epoch": 0.56, "learning_rate": 8.70255786561475e-06, "loss": 1.3215, "step": 20329 }, { "epoch": 0.56, "learning_rate": 8.701680839796234e-06, "loss": 1.3757, "step": 20330 }, { "epoch": 0.56, "learning_rate": 8.70080382413515e-06, "loss": 1.3303, "step": 20331 }, { "epoch": 0.56, "learning_rate": 8.699926818638367e-06, "loss": 1.3625, "step": 20332 }, { "epoch": 0.56, "learning_rate": 8.699049823312747e-06, "loss": 1.4473, "step": 20333 }, { "epoch": 0.56, "learning_rate": 8.698172838165148e-06, "loss": 1.1421, "step": 20334 }, { "epoch": 0.56, "learning_rate": 8.697295863202435e-06, "loss": 1.3, "step": 20335 }, { "epoch": 0.56, "learning_rate": 8.696418898431465e-06, "loss": 1.2444, "step": 20336 }, { "epoch": 0.56, "learning_rate": 8.6955419438591e-06, "loss": 1.1968, "step": 20337 }, { "epoch": 0.56, "learning_rate": 8.694664999492201e-06, "loss": 1.1377, "step": 20338 }, { "epoch": 0.56, "learning_rate": 8.693788065337633e-06, "loss": 1.0208, "step": 20339 }, { "epoch": 0.56, "learning_rate": 8.69291114140225e-06, "loss": 1.2468, "step": 20340 }, { "epoch": 0.56, "learning_rate": 8.692034227692916e-06, "loss": 1.3254, "step": 20341 }, { "epoch": 0.56, "learning_rate": 8.69115732421649e-06, "loss": 1.0981, "step": 20342 }, { "epoch": 0.56, "learning_rate": 8.690280430979836e-06, "loss": 1.2336, "step": 20343 }, { "epoch": 0.56, "learning_rate": 8.68940354798981e-06, "loss": 1.2285, "step": 20344 }, { "epoch": 0.56, "learning_rate": 8.688526675253276e-06, "loss": 1.1362, "step": 20345 }, { "epoch": 0.56, "learning_rate": 8.68764981277709e-06, "loss": 1.2244, "step": 20346 }, { "epoch": 0.56, "learning_rate": 8.686772960568117e-06, "loss": 1.2205, "step": 20347 }, { "epoch": 0.56, "learning_rate": 8.685896118633215e-06, "loss": 1.2007, "step": 20348 }, { "epoch": 0.56, "learning_rate": 8.685019286979241e-06, "loss": 1.1865, "step": 20349 }, { "epoch": 0.56, "learning_rate": 8.684142465613063e-06, "loss": 1.3044, "step": 20350 }, { "epoch": 0.56, "learning_rate": 8.68326565454153e-06, "loss": 1.3455, "step": 20351 }, { "epoch": 0.56, "learning_rate": 8.682388853771512e-06, "loss": 1.3601, "step": 20352 }, { "epoch": 0.56, "learning_rate": 8.68151206330986e-06, "loss": 1.2551, "step": 20353 }, { "epoch": 0.56, "learning_rate": 8.680635283163442e-06, "loss": 1.3486, "step": 20354 }, { "epoch": 0.56, "learning_rate": 8.679758513339108e-06, "loss": 1.1743, "step": 20355 }, { "epoch": 0.56, "learning_rate": 8.678881753843726e-06, "loss": 1.4084, "step": 20356 }, { "epoch": 0.56, "learning_rate": 8.67800500468415e-06, "loss": 1.3826, "step": 20357 }, { "epoch": 0.56, "learning_rate": 8.677128265867246e-06, "loss": 1.2161, "step": 20358 }, { "epoch": 0.56, "learning_rate": 8.676251537399863e-06, "loss": 1.2031, "step": 20359 }, { "epoch": 0.56, "learning_rate": 8.675374819288868e-06, "loss": 1.2136, "step": 20360 }, { "epoch": 0.56, "learning_rate": 8.674498111541116e-06, "loss": 1.4148, "step": 20361 }, { "epoch": 0.56, "learning_rate": 8.673621414163468e-06, "loss": 1.1096, "step": 20362 }, { "epoch": 0.56, "learning_rate": 8.672744727162782e-06, "loss": 1.4172, "step": 20363 }, { "epoch": 0.56, "learning_rate": 8.671868050545915e-06, "loss": 1.198, "step": 20364 }, { "epoch": 0.56, "learning_rate": 8.670991384319733e-06, "loss": 1.2927, "step": 20365 }, { "epoch": 0.56, "learning_rate": 8.670114728491085e-06, "loss": 1.1843, "step": 20366 }, { "epoch": 0.56, "learning_rate": 8.66923808306684e-06, "loss": 1.3596, "step": 20367 }, { "epoch": 0.56, "learning_rate": 8.66836144805384e-06, "loss": 1.0476, "step": 20368 }, { "epoch": 0.56, "learning_rate": 8.667484823458966e-06, "loss": 1.2534, "step": 20369 }, { "epoch": 0.56, "learning_rate": 8.666608209289054e-06, "loss": 1.2527, "step": 20370 }, { "epoch": 0.56, "learning_rate": 8.665731605550981e-06, "loss": 1.2678, "step": 20371 }, { "epoch": 0.56, "learning_rate": 8.664855012251589e-06, "loss": 1.4309, "step": 20372 }, { "epoch": 0.56, "learning_rate": 8.66397842939775e-06, "loss": 1.218, "step": 20373 }, { "epoch": 0.56, "learning_rate": 8.66310185699631e-06, "loss": 1.3247, "step": 20374 }, { "epoch": 0.56, "learning_rate": 8.662225295054139e-06, "loss": 1.2178, "step": 20375 }, { "epoch": 0.56, "learning_rate": 8.66134874357808e-06, "loss": 1.3979, "step": 20376 }, { "epoch": 0.56, "learning_rate": 8.660472202575007e-06, "loss": 1.7534, "step": 20377 }, { "epoch": 0.56, "learning_rate": 8.659595672051762e-06, "loss": 1.3372, "step": 20378 }, { "epoch": 0.56, "learning_rate": 8.658719152015213e-06, "loss": 1.3118, "step": 20379 }, { "epoch": 0.56, "learning_rate": 8.657842642472216e-06, "loss": 1.3098, "step": 20380 }, { "epoch": 0.56, "learning_rate": 8.656966143429626e-06, "loss": 1.1987, "step": 20381 }, { "epoch": 0.56, "learning_rate": 8.656089654894302e-06, "loss": 1.3838, "step": 20382 }, { "epoch": 0.56, "learning_rate": 8.655213176873099e-06, "loss": 1.3232, "step": 20383 }, { "epoch": 0.56, "learning_rate": 8.65433670937288e-06, "loss": 1.2607, "step": 20384 }, { "epoch": 0.56, "learning_rate": 8.653460252400494e-06, "loss": 1.4165, "step": 20385 }, { "epoch": 0.56, "learning_rate": 8.652583805962802e-06, "loss": 1.7236, "step": 20386 }, { "epoch": 0.56, "learning_rate": 8.651707370066661e-06, "loss": 1.1387, "step": 20387 }, { "epoch": 0.56, "learning_rate": 8.65083094471893e-06, "loss": 1.188, "step": 20388 }, { "epoch": 0.56, "learning_rate": 8.649954529926459e-06, "loss": 1.2151, "step": 20389 }, { "epoch": 0.56, "learning_rate": 8.649078125696113e-06, "loss": 1.1384, "step": 20390 }, { "epoch": 0.56, "learning_rate": 8.648201732034742e-06, "loss": 1.4048, "step": 20391 }, { "epoch": 0.56, "learning_rate": 8.647325348949207e-06, "loss": 1.4243, "step": 20392 }, { "epoch": 0.56, "learning_rate": 8.64644897644636e-06, "loss": 1.2778, "step": 20393 }, { "epoch": 0.56, "learning_rate": 8.64557261453306e-06, "loss": 1.283, "step": 20394 }, { "epoch": 0.56, "learning_rate": 8.644696263216164e-06, "loss": 1.4761, "step": 20395 }, { "epoch": 0.56, "learning_rate": 8.643819922502526e-06, "loss": 1.2922, "step": 20396 }, { "epoch": 0.56, "learning_rate": 8.642943592399005e-06, "loss": 1.3545, "step": 20397 }, { "epoch": 0.56, "learning_rate": 8.642067272912453e-06, "loss": 1.3257, "step": 20398 }, { "epoch": 0.56, "learning_rate": 8.641190964049731e-06, "loss": 1.2844, "step": 20399 }, { "epoch": 0.56, "learning_rate": 8.64031466581769e-06, "loss": 1.3591, "step": 20400 }, { "epoch": 0.56, "learning_rate": 8.639438378223189e-06, "loss": 1.1572, "step": 20401 }, { "epoch": 0.56, "learning_rate": 8.63856210127308e-06, "loss": 1.2285, "step": 20402 }, { "epoch": 0.56, "learning_rate": 8.637685834974223e-06, "loss": 1.3455, "step": 20403 }, { "epoch": 0.56, "learning_rate": 8.63680957933347e-06, "loss": 1.1619, "step": 20404 }, { "epoch": 0.56, "learning_rate": 8.63593333435768e-06, "loss": 1.3098, "step": 20405 }, { "epoch": 0.56, "learning_rate": 8.635057100053704e-06, "loss": 1.2339, "step": 20406 }, { "epoch": 0.56, "learning_rate": 8.6341808764284e-06, "loss": 1.1655, "step": 20407 }, { "epoch": 0.56, "learning_rate": 8.633304663488622e-06, "loss": 1.2698, "step": 20408 }, { "epoch": 0.56, "learning_rate": 8.632428461241228e-06, "loss": 1.3032, "step": 20409 }, { "epoch": 0.56, "learning_rate": 8.631552269693067e-06, "loss": 1.1812, "step": 20410 }, { "epoch": 0.56, "learning_rate": 8.630676088850996e-06, "loss": 1.3501, "step": 20411 }, { "epoch": 0.56, "learning_rate": 8.62979991872188e-06, "loss": 1.2349, "step": 20412 }, { "epoch": 0.56, "learning_rate": 8.628923759312556e-06, "loss": 1.3945, "step": 20413 }, { "epoch": 0.56, "learning_rate": 8.628047610629895e-06, "loss": 1.322, "step": 20414 }, { "epoch": 0.56, "learning_rate": 8.627171472680738e-06, "loss": 1.1764, "step": 20415 }, { "epoch": 0.56, "learning_rate": 8.626295345471953e-06, "loss": 1.3369, "step": 20416 }, { "epoch": 0.56, "learning_rate": 8.62541922901038e-06, "loss": 1.1687, "step": 20417 }, { "epoch": 0.56, "learning_rate": 8.624543123302887e-06, "loss": 1.3206, "step": 20418 }, { "epoch": 0.56, "learning_rate": 8.623667028356315e-06, "loss": 1.4954, "step": 20419 }, { "epoch": 0.56, "learning_rate": 8.622790944177532e-06, "loss": 1.3203, "step": 20420 }, { "epoch": 0.56, "learning_rate": 8.62191487077338e-06, "loss": 1.3608, "step": 20421 }, { "epoch": 0.56, "learning_rate": 8.621038808150721e-06, "loss": 1.0974, "step": 20422 }, { "epoch": 0.56, "learning_rate": 8.620162756316403e-06, "loss": 1.3406, "step": 20423 }, { "epoch": 0.56, "learning_rate": 8.619286715277286e-06, "loss": 1.4077, "step": 20424 }, { "epoch": 0.56, "learning_rate": 8.618410685040216e-06, "loss": 1.3215, "step": 20425 }, { "epoch": 0.56, "learning_rate": 8.617534665612052e-06, "loss": 1.6069, "step": 20426 }, { "epoch": 0.56, "learning_rate": 8.616658656999652e-06, "loss": 1.2749, "step": 20427 }, { "epoch": 0.56, "learning_rate": 8.61578265920986e-06, "loss": 1.2278, "step": 20428 }, { "epoch": 0.56, "learning_rate": 8.614906672249534e-06, "loss": 1.2927, "step": 20429 }, { "epoch": 0.56, "learning_rate": 8.614030696125526e-06, "loss": 1.2397, "step": 20430 }, { "epoch": 0.56, "learning_rate": 8.613154730844694e-06, "loss": 1.4102, "step": 20431 }, { "epoch": 0.56, "learning_rate": 8.612278776413883e-06, "loss": 1.2673, "step": 20432 }, { "epoch": 0.56, "learning_rate": 8.611402832839954e-06, "loss": 1.2493, "step": 20433 }, { "epoch": 0.56, "learning_rate": 8.610526900129752e-06, "loss": 1.2305, "step": 20434 }, { "epoch": 0.56, "learning_rate": 8.609650978290138e-06, "loss": 1.3186, "step": 20435 }, { "epoch": 0.56, "learning_rate": 8.608775067327958e-06, "loss": 1.2888, "step": 20436 }, { "epoch": 0.56, "learning_rate": 8.60789916725007e-06, "loss": 1.1277, "step": 20437 }, { "epoch": 0.56, "learning_rate": 8.607023278063324e-06, "loss": 1.2559, "step": 20438 }, { "epoch": 0.56, "learning_rate": 8.606147399774573e-06, "loss": 1.3035, "step": 20439 }, { "epoch": 0.56, "learning_rate": 8.605271532390666e-06, "loss": 1.1567, "step": 20440 }, { "epoch": 0.56, "learning_rate": 8.604395675918461e-06, "loss": 1.2424, "step": 20441 }, { "epoch": 0.56, "learning_rate": 8.60351983036481e-06, "loss": 1.2917, "step": 20442 }, { "epoch": 0.56, "learning_rate": 8.60264399573656e-06, "loss": 1.1575, "step": 20443 }, { "epoch": 0.56, "learning_rate": 8.60176817204057e-06, "loss": 1.1682, "step": 20444 }, { "epoch": 0.56, "learning_rate": 8.600892359283684e-06, "loss": 1.2415, "step": 20445 }, { "epoch": 0.56, "learning_rate": 8.600016557472762e-06, "loss": 1.1755, "step": 20446 }, { "epoch": 0.56, "learning_rate": 8.599140766614648e-06, "loss": 1.3357, "step": 20447 }, { "epoch": 0.56, "learning_rate": 8.598264986716202e-06, "loss": 1.3376, "step": 20448 }, { "epoch": 0.56, "learning_rate": 8.597389217784268e-06, "loss": 1.3218, "step": 20449 }, { "epoch": 0.56, "learning_rate": 8.596513459825705e-06, "loss": 1.314, "step": 20450 }, { "epoch": 0.56, "learning_rate": 8.595637712847357e-06, "loss": 1.6851, "step": 20451 }, { "epoch": 0.56, "learning_rate": 8.594761976856082e-06, "loss": 1.2686, "step": 20452 }, { "epoch": 0.56, "learning_rate": 8.593886251858727e-06, "loss": 1.2778, "step": 20453 }, { "epoch": 0.56, "learning_rate": 8.593010537862147e-06, "loss": 1.177, "step": 20454 }, { "epoch": 0.56, "learning_rate": 8.592134834873186e-06, "loss": 1.3037, "step": 20455 }, { "epoch": 0.56, "learning_rate": 8.591259142898702e-06, "loss": 1.6958, "step": 20456 }, { "epoch": 0.56, "learning_rate": 8.590383461945549e-06, "loss": 1.2744, "step": 20457 }, { "epoch": 0.56, "learning_rate": 8.589507792020565e-06, "loss": 1.3059, "step": 20458 }, { "epoch": 0.56, "learning_rate": 8.588632133130617e-06, "loss": 1.4177, "step": 20459 }, { "epoch": 0.56, "learning_rate": 8.58775648528254e-06, "loss": 1.0441, "step": 20460 }, { "epoch": 0.56, "learning_rate": 8.586880848483199e-06, "loss": 1.3931, "step": 20461 }, { "epoch": 0.56, "learning_rate": 8.58600522273943e-06, "loss": 1.2632, "step": 20462 }, { "epoch": 0.56, "learning_rate": 8.5851296080581e-06, "loss": 1.1421, "step": 20463 }, { "epoch": 0.56, "learning_rate": 8.584254004446043e-06, "loss": 1.3386, "step": 20464 }, { "epoch": 0.56, "learning_rate": 8.583378411910125e-06, "loss": 1.1177, "step": 20465 }, { "epoch": 0.56, "learning_rate": 8.582502830457178e-06, "loss": 1.2302, "step": 20466 }, { "epoch": 0.56, "learning_rate": 8.581627260094072e-06, "loss": 1.2886, "step": 20467 }, { "epoch": 0.56, "learning_rate": 8.580751700827639e-06, "loss": 1.2021, "step": 20468 }, { "epoch": 0.56, "learning_rate": 8.579876152664746e-06, "loss": 1.322, "step": 20469 }, { "epoch": 0.56, "learning_rate": 8.579000615612225e-06, "loss": 1.5293, "step": 20470 }, { "epoch": 0.56, "learning_rate": 8.578125089676944e-06, "loss": 1.2539, "step": 20471 }, { "epoch": 0.56, "learning_rate": 8.577249574865734e-06, "loss": 1.1409, "step": 20472 }, { "epoch": 0.56, "learning_rate": 8.576374071185459e-06, "loss": 1.3259, "step": 20473 }, { "epoch": 0.56, "learning_rate": 8.575498578642966e-06, "loss": 1.3479, "step": 20474 }, { "epoch": 0.56, "learning_rate": 8.5746230972451e-06, "loss": 1.3779, "step": 20475 }, { "epoch": 0.56, "learning_rate": 8.573747626998715e-06, "loss": 1.3911, "step": 20476 }, { "epoch": 0.56, "learning_rate": 8.572872167910654e-06, "loss": 1.3062, "step": 20477 }, { "epoch": 0.56, "learning_rate": 8.571996719987774e-06, "loss": 1.4902, "step": 20478 }, { "epoch": 0.56, "learning_rate": 8.571121283236915e-06, "loss": 1.1577, "step": 20479 }, { "epoch": 0.56, "learning_rate": 8.570245857664936e-06, "loss": 1.219, "step": 20480 }, { "epoch": 0.56, "learning_rate": 8.56937044327868e-06, "loss": 1.0765, "step": 20481 }, { "epoch": 0.56, "learning_rate": 8.568495040084998e-06, "loss": 1.1995, "step": 20482 }, { "epoch": 0.56, "learning_rate": 8.567619648090735e-06, "loss": 1.3616, "step": 20483 }, { "epoch": 0.56, "learning_rate": 8.566744267302745e-06, "loss": 1.1758, "step": 20484 }, { "epoch": 0.56, "learning_rate": 8.565868897727872e-06, "loss": 1.427, "step": 20485 }, { "epoch": 0.56, "learning_rate": 8.564993539372967e-06, "loss": 1.2576, "step": 20486 }, { "epoch": 0.56, "learning_rate": 8.564118192244877e-06, "loss": 1.1237, "step": 20487 }, { "epoch": 0.56, "learning_rate": 8.56324285635045e-06, "loss": 1.2764, "step": 20488 }, { "epoch": 0.56, "learning_rate": 8.562367531696538e-06, "loss": 1.3345, "step": 20489 }, { "epoch": 0.56, "learning_rate": 8.561492218289985e-06, "loss": 1.356, "step": 20490 }, { "epoch": 0.56, "learning_rate": 8.56061691613764e-06, "loss": 1.4351, "step": 20491 }, { "epoch": 0.56, "learning_rate": 8.559741625246351e-06, "loss": 1.4268, "step": 20492 }, { "epoch": 0.56, "learning_rate": 8.558866345622969e-06, "loss": 1.4497, "step": 20493 }, { "epoch": 0.56, "learning_rate": 8.557991077274337e-06, "loss": 1.2341, "step": 20494 }, { "epoch": 0.56, "learning_rate": 8.557115820207306e-06, "loss": 1.303, "step": 20495 }, { "epoch": 0.56, "learning_rate": 8.556240574428721e-06, "loss": 1.3037, "step": 20496 }, { "epoch": 0.56, "learning_rate": 8.555365339945434e-06, "loss": 1.1533, "step": 20497 }, { "epoch": 0.56, "learning_rate": 8.554490116764285e-06, "loss": 1.1921, "step": 20498 }, { "epoch": 0.56, "learning_rate": 8.553614904892129e-06, "loss": 1.0935, "step": 20499 }, { "epoch": 0.56, "learning_rate": 8.552739704335806e-06, "loss": 1.2727, "step": 20500 }, { "epoch": 0.56, "learning_rate": 8.55186451510217e-06, "loss": 1.2595, "step": 20501 }, { "epoch": 0.56, "learning_rate": 8.550989337198063e-06, "loss": 1.2229, "step": 20502 }, { "epoch": 0.56, "learning_rate": 8.550114170630333e-06, "loss": 1.1917, "step": 20503 }, { "epoch": 0.56, "learning_rate": 8.549239015405833e-06, "loss": 1.2256, "step": 20504 }, { "epoch": 0.56, "learning_rate": 8.548363871531398e-06, "loss": 1.2751, "step": 20505 }, { "epoch": 0.56, "learning_rate": 8.54748873901389e-06, "loss": 1.2666, "step": 20506 }, { "epoch": 0.56, "learning_rate": 8.546613617860138e-06, "loss": 1.1726, "step": 20507 }, { "epoch": 0.56, "learning_rate": 8.545738508077007e-06, "loss": 1.3682, "step": 20508 }, { "epoch": 0.56, "learning_rate": 8.544863409671324e-06, "loss": 1.384, "step": 20509 }, { "epoch": 0.56, "learning_rate": 8.543988322649954e-06, "loss": 1.2932, "step": 20510 }, { "epoch": 0.56, "learning_rate": 8.543113247019729e-06, "loss": 1.217, "step": 20511 }, { "epoch": 0.56, "learning_rate": 8.542238182787506e-06, "loss": 1.3142, "step": 20512 }, { "epoch": 0.56, "learning_rate": 8.541363129960119e-06, "loss": 1.3762, "step": 20513 }, { "epoch": 0.56, "learning_rate": 8.54048808854443e-06, "loss": 1.231, "step": 20514 }, { "epoch": 0.56, "learning_rate": 8.539613058547267e-06, "loss": 1.2832, "step": 20515 }, { "epoch": 0.56, "learning_rate": 8.538738039975492e-06, "loss": 1.2686, "step": 20516 }, { "epoch": 0.56, "learning_rate": 8.537863032835937e-06, "loss": 1.2412, "step": 20517 }, { "epoch": 0.56, "learning_rate": 8.536988037135456e-06, "loss": 1.3501, "step": 20518 }, { "epoch": 0.56, "learning_rate": 8.536113052880895e-06, "loss": 1.2102, "step": 20519 }, { "epoch": 0.56, "learning_rate": 8.535238080079096e-06, "loss": 1.178, "step": 20520 }, { "epoch": 0.56, "learning_rate": 8.534363118736905e-06, "loss": 1.4626, "step": 20521 }, { "epoch": 0.56, "learning_rate": 8.533488168861167e-06, "loss": 1.1511, "step": 20522 }, { "epoch": 0.56, "learning_rate": 8.532613230458731e-06, "loss": 1.2383, "step": 20523 }, { "epoch": 0.56, "learning_rate": 8.531738303536436e-06, "loss": 1.3521, "step": 20524 }, { "epoch": 0.56, "learning_rate": 8.530863388101132e-06, "loss": 1.4373, "step": 20525 }, { "epoch": 0.56, "learning_rate": 8.529988484159662e-06, "loss": 1.7998, "step": 20526 }, { "epoch": 0.56, "learning_rate": 8.52911359171887e-06, "loss": 1.2395, "step": 20527 }, { "epoch": 0.56, "learning_rate": 8.528238710785602e-06, "loss": 1.4299, "step": 20528 }, { "epoch": 0.56, "learning_rate": 8.527363841366703e-06, "loss": 1.2461, "step": 20529 }, { "epoch": 0.56, "learning_rate": 8.526488983469014e-06, "loss": 1.322, "step": 20530 }, { "epoch": 0.56, "learning_rate": 8.525614137099386e-06, "loss": 1.2568, "step": 20531 }, { "epoch": 0.56, "learning_rate": 8.524739302264656e-06, "loss": 1.3477, "step": 20532 }, { "epoch": 0.56, "learning_rate": 8.523864478971675e-06, "loss": 1.3752, "step": 20533 }, { "epoch": 0.56, "learning_rate": 8.522989667227283e-06, "loss": 1.0984, "step": 20534 }, { "epoch": 0.56, "learning_rate": 8.522114867038323e-06, "loss": 1.312, "step": 20535 }, { "epoch": 0.56, "learning_rate": 8.521240078411646e-06, "loss": 1.3467, "step": 20536 }, { "epoch": 0.56, "learning_rate": 8.520365301354087e-06, "loss": 1.4087, "step": 20537 }, { "epoch": 0.56, "learning_rate": 8.519490535872499e-06, "loss": 1.3677, "step": 20538 }, { "epoch": 0.56, "learning_rate": 8.518615781973716e-06, "loss": 1.1375, "step": 20539 }, { "epoch": 0.56, "learning_rate": 8.517741039664588e-06, "loss": 1.2683, "step": 20540 }, { "epoch": 0.56, "learning_rate": 8.516866308951957e-06, "loss": 1.2441, "step": 20541 }, { "epoch": 0.56, "learning_rate": 8.51599158984267e-06, "loss": 1.3256, "step": 20542 }, { "epoch": 0.56, "learning_rate": 8.515116882343563e-06, "loss": 1.3804, "step": 20543 }, { "epoch": 0.56, "learning_rate": 8.514242186461485e-06, "loss": 1.3486, "step": 20544 }, { "epoch": 0.56, "learning_rate": 8.513367502203277e-06, "loss": 1.2786, "step": 20545 }, { "epoch": 0.56, "learning_rate": 8.512492829575783e-06, "loss": 1.3501, "step": 20546 }, { "epoch": 0.56, "learning_rate": 8.511618168585844e-06, "loss": 1.228, "step": 20547 }, { "epoch": 0.56, "learning_rate": 8.510743519240305e-06, "loss": 1.3025, "step": 20548 }, { "epoch": 0.56, "learning_rate": 8.509868881546008e-06, "loss": 1.3252, "step": 20549 }, { "epoch": 0.56, "learning_rate": 8.508994255509795e-06, "loss": 1.3984, "step": 20550 }, { "epoch": 0.56, "learning_rate": 8.508119641138514e-06, "loss": 1.1284, "step": 20551 }, { "epoch": 0.56, "learning_rate": 8.507245038438999e-06, "loss": 1.3235, "step": 20552 }, { "epoch": 0.56, "learning_rate": 8.506370447418104e-06, "loss": 1.6965, "step": 20553 }, { "epoch": 0.56, "learning_rate": 8.505495868082656e-06, "loss": 1.323, "step": 20554 }, { "epoch": 0.56, "learning_rate": 8.504621300439512e-06, "loss": 1.1602, "step": 20555 }, { "epoch": 0.56, "learning_rate": 8.503746744495501e-06, "loss": 1.2639, "step": 20556 }, { "epoch": 0.56, "learning_rate": 8.502872200257479e-06, "loss": 1.1714, "step": 20557 }, { "epoch": 0.56, "learning_rate": 8.501997667732275e-06, "loss": 1.3672, "step": 20558 }, { "epoch": 0.56, "learning_rate": 8.50112314692674e-06, "loss": 1.4946, "step": 20559 }, { "epoch": 0.56, "learning_rate": 8.500248637847712e-06, "loss": 1.2451, "step": 20560 }, { "epoch": 0.56, "learning_rate": 8.499374140502035e-06, "loss": 1.2922, "step": 20561 }, { "epoch": 0.56, "learning_rate": 8.498499654896546e-06, "loss": 1.3892, "step": 20562 }, { "epoch": 0.56, "learning_rate": 8.497625181038093e-06, "loss": 1.1337, "step": 20563 }, { "epoch": 0.56, "learning_rate": 8.496750718933511e-06, "loss": 1.2815, "step": 20564 }, { "epoch": 0.56, "learning_rate": 8.495876268589645e-06, "loss": 1.3367, "step": 20565 }, { "epoch": 0.56, "learning_rate": 8.495001830013338e-06, "loss": 1.2148, "step": 20566 }, { "epoch": 0.56, "learning_rate": 8.494127403211428e-06, "loss": 1.2949, "step": 20567 }, { "epoch": 0.56, "learning_rate": 8.493252988190757e-06, "loss": 1.2164, "step": 20568 }, { "epoch": 0.56, "learning_rate": 8.492378584958165e-06, "loss": 1.2118, "step": 20569 }, { "epoch": 0.56, "learning_rate": 8.491504193520495e-06, "loss": 1.3181, "step": 20570 }, { "epoch": 0.56, "learning_rate": 8.490629813884586e-06, "loss": 1.4011, "step": 20571 }, { "epoch": 0.56, "learning_rate": 8.489755446057282e-06, "loss": 1.3313, "step": 20572 }, { "epoch": 0.56, "learning_rate": 8.488881090045419e-06, "loss": 1.3845, "step": 20573 }, { "epoch": 0.56, "learning_rate": 8.488006745855841e-06, "loss": 1.2834, "step": 20574 }, { "epoch": 0.56, "learning_rate": 8.487132413495386e-06, "loss": 1.1584, "step": 20575 }, { "epoch": 0.56, "learning_rate": 8.486258092970898e-06, "loss": 1.4419, "step": 20576 }, { "epoch": 0.56, "learning_rate": 8.48538378428921e-06, "loss": 1.2781, "step": 20577 }, { "epoch": 0.56, "learning_rate": 8.484509487457173e-06, "loss": 1.3481, "step": 20578 }, { "epoch": 0.56, "learning_rate": 8.483635202481617e-06, "loss": 1.2629, "step": 20579 }, { "epoch": 0.56, "learning_rate": 8.482760929369386e-06, "loss": 1.7051, "step": 20580 }, { "epoch": 0.56, "learning_rate": 8.481886668127323e-06, "loss": 1.1626, "step": 20581 }, { "epoch": 0.56, "learning_rate": 8.481012418762262e-06, "loss": 1.2917, "step": 20582 }, { "epoch": 0.56, "learning_rate": 8.480138181281049e-06, "loss": 1.7529, "step": 20583 }, { "epoch": 0.56, "learning_rate": 8.479263955690516e-06, "loss": 1.4568, "step": 20584 }, { "epoch": 0.56, "learning_rate": 8.478389741997509e-06, "loss": 1.3352, "step": 20585 }, { "epoch": 0.56, "learning_rate": 8.477515540208865e-06, "loss": 1.3857, "step": 20586 }, { "epoch": 0.56, "learning_rate": 8.476641350331424e-06, "loss": 1.252, "step": 20587 }, { "epoch": 0.56, "learning_rate": 8.475767172372022e-06, "loss": 1.2642, "step": 20588 }, { "epoch": 0.56, "learning_rate": 8.474893006337504e-06, "loss": 1.2861, "step": 20589 }, { "epoch": 0.56, "learning_rate": 8.474018852234705e-06, "loss": 1.2131, "step": 20590 }, { "epoch": 0.56, "learning_rate": 8.473144710070466e-06, "loss": 1.4697, "step": 20591 }, { "epoch": 0.56, "learning_rate": 8.47227057985162e-06, "loss": 1.2083, "step": 20592 }, { "epoch": 0.56, "learning_rate": 8.471396461585018e-06, "loss": 1.1199, "step": 20593 }, { "epoch": 0.56, "learning_rate": 8.470522355277483e-06, "loss": 1.4204, "step": 20594 }, { "epoch": 0.56, "learning_rate": 8.469648260935871e-06, "loss": 1.4622, "step": 20595 }, { "epoch": 0.56, "learning_rate": 8.468774178567003e-06, "loss": 1.2368, "step": 20596 }, { "epoch": 0.56, "learning_rate": 8.46790010817773e-06, "loss": 1.24, "step": 20597 }, { "epoch": 0.56, "learning_rate": 8.467026049774886e-06, "loss": 1.3503, "step": 20598 }, { "epoch": 0.56, "learning_rate": 8.466152003365308e-06, "loss": 1.3525, "step": 20599 }, { "epoch": 0.56, "learning_rate": 8.465277968955837e-06, "loss": 1.3438, "step": 20600 }, { "epoch": 0.56, "learning_rate": 8.464403946553308e-06, "loss": 1.3252, "step": 20601 }, { "epoch": 0.56, "learning_rate": 8.463529936164563e-06, "loss": 1.2659, "step": 20602 }, { "epoch": 0.56, "learning_rate": 8.462655937796434e-06, "loss": 1.3586, "step": 20603 }, { "epoch": 0.56, "learning_rate": 8.461781951455766e-06, "loss": 1.3386, "step": 20604 }, { "epoch": 0.56, "learning_rate": 8.460907977149388e-06, "loss": 1.1477, "step": 20605 }, { "epoch": 0.56, "learning_rate": 8.460034014884146e-06, "loss": 1.2976, "step": 20606 }, { "epoch": 0.56, "learning_rate": 8.459160064666872e-06, "loss": 1.3994, "step": 20607 }, { "epoch": 0.56, "learning_rate": 8.458286126504406e-06, "loss": 1.3577, "step": 20608 }, { "epoch": 0.56, "learning_rate": 8.457412200403585e-06, "loss": 1.4248, "step": 20609 }, { "epoch": 0.56, "learning_rate": 8.456538286371245e-06, "loss": 1.283, "step": 20610 }, { "epoch": 0.56, "learning_rate": 8.455664384414222e-06, "loss": 1.2781, "step": 20611 }, { "epoch": 0.56, "learning_rate": 8.454790494539355e-06, "loss": 1.2739, "step": 20612 }, { "epoch": 0.56, "learning_rate": 8.453916616753482e-06, "loss": 1.2808, "step": 20613 }, { "epoch": 0.56, "learning_rate": 8.453042751063437e-06, "loss": 1.4673, "step": 20614 }, { "epoch": 0.56, "learning_rate": 8.452168897476059e-06, "loss": 1.2297, "step": 20615 }, { "epoch": 0.56, "learning_rate": 8.451295055998183e-06, "loss": 1.4307, "step": 20616 }, { "epoch": 0.56, "learning_rate": 8.450421226636649e-06, "loss": 1.2771, "step": 20617 }, { "epoch": 0.56, "learning_rate": 8.449547409398287e-06, "loss": 1.2617, "step": 20618 }, { "epoch": 0.56, "learning_rate": 8.448673604289939e-06, "loss": 1.2532, "step": 20619 }, { "epoch": 0.56, "learning_rate": 8.447799811318438e-06, "loss": 1.1675, "step": 20620 }, { "epoch": 0.56, "learning_rate": 8.446926030490623e-06, "loss": 1.328, "step": 20621 }, { "epoch": 0.56, "learning_rate": 8.446052261813326e-06, "loss": 1.408, "step": 20622 }, { "epoch": 0.56, "learning_rate": 8.445178505293388e-06, "loss": 1.3408, "step": 20623 }, { "epoch": 0.56, "learning_rate": 8.444304760937641e-06, "loss": 1.3359, "step": 20624 }, { "epoch": 0.56, "learning_rate": 8.443431028752922e-06, "loss": 1.1499, "step": 20625 }, { "epoch": 0.56, "learning_rate": 8.442557308746066e-06, "loss": 1.3945, "step": 20626 }, { "epoch": 0.56, "learning_rate": 8.441683600923907e-06, "loss": 1.2632, "step": 20627 }, { "epoch": 0.56, "learning_rate": 8.44080990529329e-06, "loss": 1.4485, "step": 20628 }, { "epoch": 0.56, "learning_rate": 8.439936221861035e-06, "loss": 1.2224, "step": 20629 }, { "epoch": 0.56, "learning_rate": 8.439062550633992e-06, "loss": 1.3381, "step": 20630 }, { "epoch": 0.56, "learning_rate": 8.438188891618983e-06, "loss": 1.3384, "step": 20631 }, { "epoch": 0.56, "learning_rate": 8.437315244822858e-06, "loss": 1.1284, "step": 20632 }, { "epoch": 0.56, "learning_rate": 8.436441610252435e-06, "loss": 1.3442, "step": 20633 }, { "epoch": 0.56, "learning_rate": 8.435567987914566e-06, "loss": 1.251, "step": 20634 }, { "epoch": 0.56, "learning_rate": 8.43469437781607e-06, "loss": 1.3748, "step": 20635 }, { "epoch": 0.56, "learning_rate": 8.433820779963796e-06, "loss": 1.2722, "step": 20636 }, { "epoch": 0.56, "learning_rate": 8.432947194364565e-06, "loss": 1.2849, "step": 20637 }, { "epoch": 0.56, "learning_rate": 8.432073621025226e-06, "loss": 1.3279, "step": 20638 }, { "epoch": 0.56, "learning_rate": 8.431200059952597e-06, "loss": 1.3142, "step": 20639 }, { "epoch": 0.56, "learning_rate": 8.430326511153529e-06, "loss": 1.418, "step": 20640 }, { "epoch": 0.56, "learning_rate": 8.42945297463484e-06, "loss": 1.3301, "step": 20641 }, { "epoch": 0.56, "learning_rate": 8.428579450403376e-06, "loss": 1.2859, "step": 20642 }, { "epoch": 0.56, "learning_rate": 8.42770593846597e-06, "loss": 1.2744, "step": 20643 }, { "epoch": 0.56, "learning_rate": 8.426832438829452e-06, "loss": 1.1936, "step": 20644 }, { "epoch": 0.56, "learning_rate": 8.425958951500657e-06, "loss": 1.2334, "step": 20645 }, { "epoch": 0.56, "learning_rate": 8.425085476486418e-06, "loss": 1.1946, "step": 20646 }, { "epoch": 0.56, "learning_rate": 8.424212013793572e-06, "loss": 1.3542, "step": 20647 }, { "epoch": 0.56, "learning_rate": 8.423338563428947e-06, "loss": 1.4138, "step": 20648 }, { "epoch": 0.56, "learning_rate": 8.422465125399383e-06, "loss": 1.3813, "step": 20649 }, { "epoch": 0.56, "learning_rate": 8.421591699711706e-06, "loss": 1.3994, "step": 20650 }, { "epoch": 0.56, "learning_rate": 8.420718286372757e-06, "loss": 1.2476, "step": 20651 }, { "epoch": 0.56, "learning_rate": 8.419844885389364e-06, "loss": 1.3113, "step": 20652 }, { "epoch": 0.56, "learning_rate": 8.418971496768363e-06, "loss": 1.2639, "step": 20653 }, { "epoch": 0.56, "learning_rate": 8.418098120516584e-06, "loss": 1.4045, "step": 20654 }, { "epoch": 0.56, "learning_rate": 8.417224756640863e-06, "loss": 1.23, "step": 20655 }, { "epoch": 0.56, "learning_rate": 8.41635140514803e-06, "loss": 1.7017, "step": 20656 }, { "epoch": 0.56, "learning_rate": 8.41547806604492e-06, "loss": 1.377, "step": 20657 }, { "epoch": 0.56, "learning_rate": 8.414604739338361e-06, "loss": 1.335, "step": 20658 }, { "epoch": 0.56, "learning_rate": 8.41373142503519e-06, "loss": 1.2146, "step": 20659 }, { "epoch": 0.56, "learning_rate": 8.412858123142242e-06, "loss": 1.564, "step": 20660 }, { "epoch": 0.56, "learning_rate": 8.411984833666343e-06, "loss": 1.2717, "step": 20661 }, { "epoch": 0.56, "learning_rate": 8.41111155661433e-06, "loss": 1.2947, "step": 20662 }, { "epoch": 0.56, "learning_rate": 8.41023829199303e-06, "loss": 1.2722, "step": 20663 }, { "epoch": 0.56, "learning_rate": 8.409365039809282e-06, "loss": 1.2983, "step": 20664 }, { "epoch": 0.56, "learning_rate": 8.40849180006991e-06, "loss": 1.2358, "step": 20665 }, { "epoch": 0.56, "learning_rate": 8.407618572781753e-06, "loss": 1.2632, "step": 20666 }, { "epoch": 0.56, "learning_rate": 8.406745357951636e-06, "loss": 1.4424, "step": 20667 }, { "epoch": 0.56, "learning_rate": 8.405872155586397e-06, "loss": 1.1721, "step": 20668 }, { "epoch": 0.56, "learning_rate": 8.404998965692864e-06, "loss": 1.26, "step": 20669 }, { "epoch": 0.56, "learning_rate": 8.40412578827787e-06, "loss": 1.2297, "step": 20670 }, { "epoch": 0.56, "learning_rate": 8.403252623348243e-06, "loss": 1.157, "step": 20671 }, { "epoch": 0.56, "learning_rate": 8.402379470910818e-06, "loss": 1.6987, "step": 20672 }, { "epoch": 0.56, "learning_rate": 8.401506330972424e-06, "loss": 1.0684, "step": 20673 }, { "epoch": 0.56, "learning_rate": 8.40063320353989e-06, "loss": 1.199, "step": 20674 }, { "epoch": 0.56, "learning_rate": 8.399760088620057e-06, "loss": 1.4246, "step": 20675 }, { "epoch": 0.56, "learning_rate": 8.398886986219741e-06, "loss": 1.3052, "step": 20676 }, { "epoch": 0.56, "learning_rate": 8.398013896345788e-06, "loss": 1.3779, "step": 20677 }, { "epoch": 0.56, "learning_rate": 8.397140819005014e-06, "loss": 1.3572, "step": 20678 }, { "epoch": 0.56, "learning_rate": 8.396267754204263e-06, "loss": 1.2795, "step": 20679 }, { "epoch": 0.56, "learning_rate": 8.395394701950352e-06, "loss": 1.3179, "step": 20680 }, { "epoch": 0.56, "learning_rate": 8.394521662250124e-06, "loss": 1.2693, "step": 20681 }, { "epoch": 0.56, "learning_rate": 8.393648635110398e-06, "loss": 1.3618, "step": 20682 }, { "epoch": 0.56, "learning_rate": 8.392775620538018e-06, "loss": 1.3303, "step": 20683 }, { "epoch": 0.56, "learning_rate": 8.391902618539798e-06, "loss": 1.1772, "step": 20684 }, { "epoch": 0.56, "learning_rate": 8.39102962912258e-06, "loss": 1.1863, "step": 20685 }, { "epoch": 0.56, "learning_rate": 8.390156652293187e-06, "loss": 1.187, "step": 20686 }, { "epoch": 0.56, "learning_rate": 8.389283688058454e-06, "loss": 1.3882, "step": 20687 }, { "epoch": 0.56, "learning_rate": 8.388410736425205e-06, "loss": 1.3274, "step": 20688 }, { "epoch": 0.57, "learning_rate": 8.387537797400273e-06, "loss": 1.2549, "step": 20689 }, { "epoch": 0.57, "learning_rate": 8.386664870990489e-06, "loss": 1.3799, "step": 20690 }, { "epoch": 0.57, "learning_rate": 8.385791957202678e-06, "loss": 1.343, "step": 20691 }, { "epoch": 0.57, "learning_rate": 8.384919056043674e-06, "loss": 1.4717, "step": 20692 }, { "epoch": 0.57, "learning_rate": 8.384046167520304e-06, "loss": 1.2188, "step": 20693 }, { "epoch": 0.57, "learning_rate": 8.383173291639396e-06, "loss": 1.3496, "step": 20694 }, { "epoch": 0.57, "learning_rate": 8.38230042840778e-06, "loss": 1.2327, "step": 20695 }, { "epoch": 0.57, "learning_rate": 8.381427577832285e-06, "loss": 1.2494, "step": 20696 }, { "epoch": 0.57, "learning_rate": 8.380554739919737e-06, "loss": 1.3877, "step": 20697 }, { "epoch": 0.57, "learning_rate": 8.379681914676971e-06, "loss": 1.3076, "step": 20698 }, { "epoch": 0.57, "learning_rate": 8.37880910211081e-06, "loss": 1.2646, "step": 20699 }, { "epoch": 0.57, "learning_rate": 8.377936302228084e-06, "loss": 1.2825, "step": 20700 }, { "epoch": 0.57, "learning_rate": 8.37706351503562e-06, "loss": 1.1456, "step": 20701 }, { "epoch": 0.57, "learning_rate": 8.376190740540254e-06, "loss": 1.2285, "step": 20702 }, { "epoch": 0.57, "learning_rate": 8.3753179787488e-06, "loss": 1.0769, "step": 20703 }, { "epoch": 0.57, "learning_rate": 8.374445229668098e-06, "loss": 1.2981, "step": 20704 }, { "epoch": 0.57, "learning_rate": 8.373572493304974e-06, "loss": 1.2947, "step": 20705 }, { "epoch": 0.57, "learning_rate": 8.372699769666251e-06, "loss": 1.238, "step": 20706 }, { "epoch": 0.57, "learning_rate": 8.371827058758763e-06, "loss": 1.4272, "step": 20707 }, { "epoch": 0.57, "learning_rate": 8.370954360589331e-06, "loss": 1.3447, "step": 20708 }, { "epoch": 0.57, "learning_rate": 8.37008167516479e-06, "loss": 1.4429, "step": 20709 }, { "epoch": 0.57, "learning_rate": 8.36920900249196e-06, "loss": 1.4236, "step": 20710 }, { "epoch": 0.57, "learning_rate": 8.368336342577674e-06, "loss": 1.302, "step": 20711 }, { "epoch": 0.57, "learning_rate": 8.367463695428755e-06, "loss": 1.2371, "step": 20712 }, { "epoch": 0.57, "learning_rate": 8.366591061052033e-06, "loss": 1.2913, "step": 20713 }, { "epoch": 0.57, "learning_rate": 8.365718439454335e-06, "loss": 1.2656, "step": 20714 }, { "epoch": 0.57, "learning_rate": 8.364845830642488e-06, "loss": 1.4043, "step": 20715 }, { "epoch": 0.57, "learning_rate": 8.363973234623316e-06, "loss": 1.2664, "step": 20716 }, { "epoch": 0.57, "learning_rate": 8.363100651403652e-06, "loss": 1.3608, "step": 20717 }, { "epoch": 0.57, "learning_rate": 8.362228080990317e-06, "loss": 1.3354, "step": 20718 }, { "epoch": 0.57, "learning_rate": 8.36135552339014e-06, "loss": 1.2275, "step": 20719 }, { "epoch": 0.57, "learning_rate": 8.360482978609946e-06, "loss": 1.7412, "step": 20720 }, { "epoch": 0.57, "learning_rate": 8.359610446656558e-06, "loss": 1.3496, "step": 20721 }, { "epoch": 0.57, "learning_rate": 8.358737927536813e-06, "loss": 1.2473, "step": 20722 }, { "epoch": 0.57, "learning_rate": 8.357865421257524e-06, "loss": 1.3577, "step": 20723 }, { "epoch": 0.57, "learning_rate": 8.356992927825533e-06, "loss": 1.3774, "step": 20724 }, { "epoch": 0.57, "learning_rate": 8.35612044724765e-06, "loss": 1.2717, "step": 20725 }, { "epoch": 0.57, "learning_rate": 8.35524797953071e-06, "loss": 1.2979, "step": 20726 }, { "epoch": 0.57, "learning_rate": 8.354375524681534e-06, "loss": 1.2009, "step": 20727 }, { "epoch": 0.57, "learning_rate": 8.353503082706955e-06, "loss": 1.3938, "step": 20728 }, { "epoch": 0.57, "learning_rate": 8.352630653613788e-06, "loss": 1.2639, "step": 20729 }, { "epoch": 0.57, "learning_rate": 8.35175823740887e-06, "loss": 1.7729, "step": 20730 }, { "epoch": 0.57, "learning_rate": 8.350885834099012e-06, "loss": 1.3491, "step": 20731 }, { "epoch": 0.57, "learning_rate": 8.350013443691057e-06, "loss": 1.2004, "step": 20732 }, { "epoch": 0.57, "learning_rate": 8.349141066191813e-06, "loss": 1.3784, "step": 20733 }, { "epoch": 0.57, "learning_rate": 8.34826870160812e-06, "loss": 1.1421, "step": 20734 }, { "epoch": 0.57, "learning_rate": 8.34739634994679e-06, "loss": 1.2578, "step": 20735 }, { "epoch": 0.57, "learning_rate": 8.346524011214656e-06, "loss": 1.377, "step": 20736 }, { "epoch": 0.57, "learning_rate": 8.345651685418544e-06, "loss": 1.0842, "step": 20737 }, { "epoch": 0.57, "learning_rate": 8.344779372565271e-06, "loss": 1.3499, "step": 20738 }, { "epoch": 0.57, "learning_rate": 8.343907072661668e-06, "loss": 1.3, "step": 20739 }, { "epoch": 0.57, "learning_rate": 8.343034785714556e-06, "loss": 1.6904, "step": 20740 }, { "epoch": 0.57, "learning_rate": 8.342162511730763e-06, "loss": 1.1677, "step": 20741 }, { "epoch": 0.57, "learning_rate": 8.341290250717107e-06, "loss": 1.1475, "step": 20742 }, { "epoch": 0.57, "learning_rate": 8.340418002680419e-06, "loss": 1.2092, "step": 20743 }, { "epoch": 0.57, "learning_rate": 8.339545767627518e-06, "loss": 1.375, "step": 20744 }, { "epoch": 0.57, "learning_rate": 8.338673545565234e-06, "loss": 1.3062, "step": 20745 }, { "epoch": 0.57, "learning_rate": 8.337801336500384e-06, "loss": 1.3601, "step": 20746 }, { "epoch": 0.57, "learning_rate": 8.336929140439796e-06, "loss": 1.2043, "step": 20747 }, { "epoch": 0.57, "learning_rate": 8.336056957390291e-06, "loss": 1.282, "step": 20748 }, { "epoch": 0.57, "learning_rate": 8.335184787358696e-06, "loss": 1.3784, "step": 20749 }, { "epoch": 0.57, "learning_rate": 8.33431263035183e-06, "loss": 1.3215, "step": 20750 }, { "epoch": 0.57, "learning_rate": 8.333440486376518e-06, "loss": 1.2642, "step": 20751 }, { "epoch": 0.57, "learning_rate": 8.332568355439588e-06, "loss": 1.3013, "step": 20752 }, { "epoch": 0.57, "learning_rate": 8.331696237547855e-06, "loss": 1.0942, "step": 20753 }, { "epoch": 0.57, "learning_rate": 8.330824132708149e-06, "loss": 1.2659, "step": 20754 }, { "epoch": 0.57, "learning_rate": 8.329952040927289e-06, "loss": 1.1074, "step": 20755 }, { "epoch": 0.57, "learning_rate": 8.3290799622121e-06, "loss": 1.2737, "step": 20756 }, { "epoch": 0.57, "learning_rate": 8.328207896569401e-06, "loss": 1.2302, "step": 20757 }, { "epoch": 0.57, "learning_rate": 8.32733584400602e-06, "loss": 1.1621, "step": 20758 }, { "epoch": 0.57, "learning_rate": 8.326463804528774e-06, "loss": 1.3762, "step": 20759 }, { "epoch": 0.57, "learning_rate": 8.325591778144494e-06, "loss": 1.3157, "step": 20760 }, { "epoch": 0.57, "learning_rate": 8.32471976485999e-06, "loss": 1.4541, "step": 20761 }, { "epoch": 0.57, "learning_rate": 8.323847764682095e-06, "loss": 1.3242, "step": 20762 }, { "epoch": 0.57, "learning_rate": 8.322975777617623e-06, "loss": 1.2888, "step": 20763 }, { "epoch": 0.57, "learning_rate": 8.322103803673403e-06, "loss": 1.4248, "step": 20764 }, { "epoch": 0.57, "learning_rate": 8.321231842856254e-06, "loss": 1.2053, "step": 20765 }, { "epoch": 0.57, "learning_rate": 8.320359895172993e-06, "loss": 1.1157, "step": 20766 }, { "epoch": 0.57, "learning_rate": 8.319487960630452e-06, "loss": 1.2168, "step": 20767 }, { "epoch": 0.57, "learning_rate": 8.318616039235443e-06, "loss": 1.178, "step": 20768 }, { "epoch": 0.57, "learning_rate": 8.317744130994796e-06, "loss": 1.3086, "step": 20769 }, { "epoch": 0.57, "learning_rate": 8.316872235915323e-06, "loss": 1.2065, "step": 20770 }, { "epoch": 0.57, "learning_rate": 8.316000354003856e-06, "loss": 1.3262, "step": 20771 }, { "epoch": 0.57, "learning_rate": 8.315128485267203e-06, "loss": 1.2939, "step": 20772 }, { "epoch": 0.57, "learning_rate": 8.3142566297122e-06, "loss": 1.3303, "step": 20773 }, { "epoch": 0.57, "learning_rate": 8.313384787345653e-06, "loss": 1.3586, "step": 20774 }, { "epoch": 0.57, "learning_rate": 8.312512958174397e-06, "loss": 1.1279, "step": 20775 }, { "epoch": 0.57, "learning_rate": 8.31164114220524e-06, "loss": 1.4121, "step": 20776 }, { "epoch": 0.57, "learning_rate": 8.310769339445015e-06, "loss": 1.3677, "step": 20777 }, { "epoch": 0.57, "learning_rate": 8.30989754990053e-06, "loss": 1.2593, "step": 20778 }, { "epoch": 0.57, "learning_rate": 8.309025773578619e-06, "loss": 1.2327, "step": 20779 }, { "epoch": 0.57, "learning_rate": 8.308154010486089e-06, "loss": 1.2737, "step": 20780 }, { "epoch": 0.57, "learning_rate": 8.307282260629773e-06, "loss": 1.3503, "step": 20781 }, { "epoch": 0.57, "learning_rate": 8.306410524016475e-06, "loss": 1.3123, "step": 20782 }, { "epoch": 0.57, "learning_rate": 8.30553880065303e-06, "loss": 1.1692, "step": 20783 }, { "epoch": 0.57, "learning_rate": 8.304667090546253e-06, "loss": 1.3401, "step": 20784 }, { "epoch": 0.57, "learning_rate": 8.303795393702962e-06, "loss": 1.4099, "step": 20785 }, { "epoch": 0.57, "learning_rate": 8.302923710129981e-06, "loss": 1.4001, "step": 20786 }, { "epoch": 0.57, "learning_rate": 8.302052039834125e-06, "loss": 1.1331, "step": 20787 }, { "epoch": 0.57, "learning_rate": 8.301180382822215e-06, "loss": 1.3162, "step": 20788 }, { "epoch": 0.57, "learning_rate": 8.300308739101071e-06, "loss": 1.2224, "step": 20789 }, { "epoch": 0.57, "learning_rate": 8.299437108677515e-06, "loss": 1.21, "step": 20790 }, { "epoch": 0.57, "learning_rate": 8.298565491558359e-06, "loss": 1.3337, "step": 20791 }, { "epoch": 0.57, "learning_rate": 8.29769388775043e-06, "loss": 1.0786, "step": 20792 }, { "epoch": 0.57, "learning_rate": 8.296822297260541e-06, "loss": 1.2937, "step": 20793 }, { "epoch": 0.57, "learning_rate": 8.295950720095517e-06, "loss": 1.1797, "step": 20794 }, { "epoch": 0.57, "learning_rate": 8.295079156262168e-06, "loss": 1.3445, "step": 20795 }, { "epoch": 0.57, "learning_rate": 8.294207605767323e-06, "loss": 1.3203, "step": 20796 }, { "epoch": 0.57, "learning_rate": 8.293336068617793e-06, "loss": 1.2332, "step": 20797 }, { "epoch": 0.57, "learning_rate": 8.292464544820398e-06, "loss": 1.3359, "step": 20798 }, { "epoch": 0.57, "learning_rate": 8.291593034381961e-06, "loss": 1.3662, "step": 20799 }, { "epoch": 0.57, "learning_rate": 8.290721537309293e-06, "loss": 1.4214, "step": 20800 }, { "epoch": 0.57, "learning_rate": 8.289850053609218e-06, "loss": 1.3474, "step": 20801 }, { "epoch": 0.57, "learning_rate": 8.288978583288552e-06, "loss": 1.2908, "step": 20802 }, { "epoch": 0.57, "learning_rate": 8.288107126354114e-06, "loss": 1.4653, "step": 20803 }, { "epoch": 0.57, "learning_rate": 8.287235682812718e-06, "loss": 1.2683, "step": 20804 }, { "epoch": 0.57, "learning_rate": 8.286364252671188e-06, "loss": 1.373, "step": 20805 }, { "epoch": 0.57, "learning_rate": 8.285492835936335e-06, "loss": 1.2473, "step": 20806 }, { "epoch": 0.57, "learning_rate": 8.284621432614982e-06, "loss": 1.2939, "step": 20807 }, { "epoch": 0.57, "learning_rate": 8.283750042713942e-06, "loss": 1.2, "step": 20808 }, { "epoch": 0.57, "learning_rate": 8.282878666240038e-06, "loss": 1.2676, "step": 20809 }, { "epoch": 0.57, "learning_rate": 8.28200730320008e-06, "loss": 1.4478, "step": 20810 }, { "epoch": 0.57, "learning_rate": 8.281135953600893e-06, "loss": 1.2803, "step": 20811 }, { "epoch": 0.57, "learning_rate": 8.280264617449287e-06, "loss": 1.3096, "step": 20812 }, { "epoch": 0.57, "learning_rate": 8.27939329475208e-06, "loss": 1.3083, "step": 20813 }, { "epoch": 0.57, "learning_rate": 8.278521985516096e-06, "loss": 1.2258, "step": 20814 }, { "epoch": 0.57, "learning_rate": 8.277650689748142e-06, "loss": 1.3882, "step": 20815 }, { "epoch": 0.57, "learning_rate": 8.276779407455044e-06, "loss": 1.3806, "step": 20816 }, { "epoch": 0.57, "learning_rate": 8.27590813864361e-06, "loss": 1.2642, "step": 20817 }, { "epoch": 0.57, "learning_rate": 8.275036883320663e-06, "loss": 1.373, "step": 20818 }, { "epoch": 0.57, "learning_rate": 8.27416564149301e-06, "loss": 1.1897, "step": 20819 }, { "epoch": 0.57, "learning_rate": 8.273294413167482e-06, "loss": 1.2368, "step": 20820 }, { "epoch": 0.57, "learning_rate": 8.272423198350878e-06, "loss": 1.3652, "step": 20821 }, { "epoch": 0.57, "learning_rate": 8.27155199705003e-06, "loss": 1.3855, "step": 20822 }, { "epoch": 0.57, "learning_rate": 8.270680809271741e-06, "loss": 1.1553, "step": 20823 }, { "epoch": 0.57, "learning_rate": 8.269809635022836e-06, "loss": 1.3103, "step": 20824 }, { "epoch": 0.57, "learning_rate": 8.268938474310124e-06, "loss": 1.3237, "step": 20825 }, { "epoch": 0.57, "learning_rate": 8.268067327140426e-06, "loss": 1.147, "step": 20826 }, { "epoch": 0.57, "learning_rate": 8.267196193520552e-06, "loss": 1.2068, "step": 20827 }, { "epoch": 0.57, "learning_rate": 8.26632507345732e-06, "loss": 1.2812, "step": 20828 }, { "epoch": 0.57, "learning_rate": 8.265453966957548e-06, "loss": 1.2944, "step": 20829 }, { "epoch": 0.57, "learning_rate": 8.264582874028048e-06, "loss": 1.3462, "step": 20830 }, { "epoch": 0.57, "learning_rate": 8.263711794675635e-06, "loss": 1.377, "step": 20831 }, { "epoch": 0.57, "learning_rate": 8.262840728907124e-06, "loss": 1.3257, "step": 20832 }, { "epoch": 0.57, "learning_rate": 8.261969676729331e-06, "loss": 1.366, "step": 20833 }, { "epoch": 0.57, "learning_rate": 8.26109863814907e-06, "loss": 1.2095, "step": 20834 }, { "epoch": 0.57, "learning_rate": 8.260227613173156e-06, "loss": 1.313, "step": 20835 }, { "epoch": 0.57, "learning_rate": 8.259356601808402e-06, "loss": 1.405, "step": 20836 }, { "epoch": 0.57, "learning_rate": 8.258485604061624e-06, "loss": 1.3987, "step": 20837 }, { "epoch": 0.57, "learning_rate": 8.257614619939635e-06, "loss": 1.2063, "step": 20838 }, { "epoch": 0.57, "learning_rate": 8.256743649449252e-06, "loss": 1.2771, "step": 20839 }, { "epoch": 0.57, "learning_rate": 8.255872692597282e-06, "loss": 1.2546, "step": 20840 }, { "epoch": 0.57, "learning_rate": 8.255001749390549e-06, "loss": 1.2739, "step": 20841 }, { "epoch": 0.57, "learning_rate": 8.25413081983586e-06, "loss": 1.311, "step": 20842 }, { "epoch": 0.57, "learning_rate": 8.253259903940031e-06, "loss": 1.2825, "step": 20843 }, { "epoch": 0.57, "learning_rate": 8.252389001709874e-06, "loss": 1.322, "step": 20844 }, { "epoch": 0.57, "learning_rate": 8.251518113152204e-06, "loss": 1.2922, "step": 20845 }, { "epoch": 0.57, "learning_rate": 8.250647238273835e-06, "loss": 1.3293, "step": 20846 }, { "epoch": 0.57, "learning_rate": 8.249776377081578e-06, "loss": 1.1501, "step": 20847 }, { "epoch": 0.57, "learning_rate": 8.24890552958225e-06, "loss": 1.3425, "step": 20848 }, { "epoch": 0.57, "learning_rate": 8.248034695782659e-06, "loss": 1.2832, "step": 20849 }, { "epoch": 0.57, "learning_rate": 8.247163875689622e-06, "loss": 1.4226, "step": 20850 }, { "epoch": 0.57, "learning_rate": 8.24629306930995e-06, "loss": 1.1616, "step": 20851 }, { "epoch": 0.57, "learning_rate": 8.245422276650458e-06, "loss": 1.3916, "step": 20852 }, { "epoch": 0.57, "learning_rate": 8.244551497717954e-06, "loss": 1.2961, "step": 20853 }, { "epoch": 0.57, "learning_rate": 8.243680732519257e-06, "loss": 1.1772, "step": 20854 }, { "epoch": 0.57, "learning_rate": 8.242809981061174e-06, "loss": 1.3186, "step": 20855 }, { "epoch": 0.57, "learning_rate": 8.24193924335052e-06, "loss": 1.6392, "step": 20856 }, { "epoch": 0.57, "learning_rate": 8.241068519394104e-06, "loss": 1.2227, "step": 20857 }, { "epoch": 0.57, "learning_rate": 8.240197809198746e-06, "loss": 1.438, "step": 20858 }, { "epoch": 0.57, "learning_rate": 8.239327112771247e-06, "loss": 1.1836, "step": 20859 }, { "epoch": 0.57, "learning_rate": 8.238456430118428e-06, "loss": 1.2107, "step": 20860 }, { "epoch": 0.57, "learning_rate": 8.237585761247098e-06, "loss": 1.1519, "step": 20861 }, { "epoch": 0.57, "learning_rate": 8.236715106164068e-06, "loss": 1.2847, "step": 20862 }, { "epoch": 0.57, "learning_rate": 8.235844464876151e-06, "loss": 1.3735, "step": 20863 }, { "epoch": 0.57, "learning_rate": 8.234973837390154e-06, "loss": 1.3403, "step": 20864 }, { "epoch": 0.57, "learning_rate": 8.234103223712895e-06, "loss": 1.3359, "step": 20865 }, { "epoch": 0.57, "learning_rate": 8.233232623851179e-06, "loss": 1.2683, "step": 20866 }, { "epoch": 0.57, "learning_rate": 8.232362037811824e-06, "loss": 1.3022, "step": 20867 }, { "epoch": 0.57, "learning_rate": 8.231491465601634e-06, "loss": 1.2173, "step": 20868 }, { "epoch": 0.57, "learning_rate": 8.230620907227425e-06, "loss": 1.1741, "step": 20869 }, { "epoch": 0.57, "learning_rate": 8.229750362696005e-06, "loss": 1.2893, "step": 20870 }, { "epoch": 0.57, "learning_rate": 8.228879832014187e-06, "loss": 1.2517, "step": 20871 }, { "epoch": 0.57, "learning_rate": 8.228009315188779e-06, "loss": 1.2056, "step": 20872 }, { "epoch": 0.57, "learning_rate": 8.227138812226593e-06, "loss": 1.2278, "step": 20873 }, { "epoch": 0.57, "learning_rate": 8.226268323134438e-06, "loss": 1.3342, "step": 20874 }, { "epoch": 0.57, "learning_rate": 8.225397847919126e-06, "loss": 1.2705, "step": 20875 }, { "epoch": 0.57, "learning_rate": 8.22452738658747e-06, "loss": 1.4639, "step": 20876 }, { "epoch": 0.57, "learning_rate": 8.223656939146274e-06, "loss": 1.3743, "step": 20877 }, { "epoch": 0.57, "learning_rate": 8.222786505602352e-06, "loss": 1.2769, "step": 20878 }, { "epoch": 0.57, "learning_rate": 8.221916085962511e-06, "loss": 1.3223, "step": 20879 }, { "epoch": 0.57, "learning_rate": 8.221045680233565e-06, "loss": 1.179, "step": 20880 }, { "epoch": 0.57, "learning_rate": 8.220175288422318e-06, "loss": 1.3918, "step": 20881 }, { "epoch": 0.57, "learning_rate": 8.219304910535585e-06, "loss": 1.1665, "step": 20882 }, { "epoch": 0.57, "learning_rate": 8.218434546580172e-06, "loss": 1.3542, "step": 20883 }, { "epoch": 0.57, "learning_rate": 8.21756419656289e-06, "loss": 1.3325, "step": 20884 }, { "epoch": 0.57, "learning_rate": 8.216693860490547e-06, "loss": 1.304, "step": 20885 }, { "epoch": 0.57, "learning_rate": 8.215823538369953e-06, "loss": 1.1882, "step": 20886 }, { "epoch": 0.57, "learning_rate": 8.214953230207917e-06, "loss": 1.3052, "step": 20887 }, { "epoch": 0.57, "learning_rate": 8.214082936011247e-06, "loss": 0.9956, "step": 20888 }, { "epoch": 0.57, "learning_rate": 8.213212655786752e-06, "loss": 1.3157, "step": 20889 }, { "epoch": 0.57, "learning_rate": 8.21234238954124e-06, "loss": 1.1128, "step": 20890 }, { "epoch": 0.57, "learning_rate": 8.211472137281524e-06, "loss": 1.1438, "step": 20891 }, { "epoch": 0.57, "learning_rate": 8.210601899014404e-06, "loss": 1.3, "step": 20892 }, { "epoch": 0.57, "learning_rate": 8.2097316747467e-06, "loss": 1.1365, "step": 20893 }, { "epoch": 0.57, "learning_rate": 8.208861464485204e-06, "loss": 1.2841, "step": 20894 }, { "epoch": 0.57, "learning_rate": 8.207991268236744e-06, "loss": 1.2998, "step": 20895 }, { "epoch": 0.57, "learning_rate": 8.207121086008109e-06, "loss": 1.2546, "step": 20896 }, { "epoch": 0.57, "learning_rate": 8.206250917806124e-06, "loss": 1.2571, "step": 20897 }, { "epoch": 0.57, "learning_rate": 8.205380763637581e-06, "loss": 1.3408, "step": 20898 }, { "epoch": 0.57, "learning_rate": 8.2045106235093e-06, "loss": 1.312, "step": 20899 }, { "epoch": 0.57, "learning_rate": 8.203640497428079e-06, "loss": 1.2954, "step": 20900 }, { "epoch": 0.57, "learning_rate": 8.202770385400736e-06, "loss": 1.304, "step": 20901 }, { "epoch": 0.57, "learning_rate": 8.201900287434066e-06, "loss": 1.3118, "step": 20902 }, { "epoch": 0.57, "learning_rate": 8.201030203534889e-06, "loss": 1.3804, "step": 20903 }, { "epoch": 0.57, "learning_rate": 8.200160133709999e-06, "loss": 1.3413, "step": 20904 }, { "epoch": 0.57, "learning_rate": 8.199290077966215e-06, "loss": 1.2546, "step": 20905 }, { "epoch": 0.57, "learning_rate": 8.198420036310335e-06, "loss": 1.1743, "step": 20906 }, { "epoch": 0.57, "learning_rate": 8.19755000874917e-06, "loss": 1.3771, "step": 20907 }, { "epoch": 0.57, "learning_rate": 8.196679995289529e-06, "loss": 1.4868, "step": 20908 }, { "epoch": 0.57, "learning_rate": 8.195809995938214e-06, "loss": 1.231, "step": 20909 }, { "epoch": 0.57, "learning_rate": 8.194940010702032e-06, "loss": 1.3813, "step": 20910 }, { "epoch": 0.57, "learning_rate": 8.194070039587792e-06, "loss": 1.3, "step": 20911 }, { "epoch": 0.57, "learning_rate": 8.193200082602299e-06, "loss": 1.2017, "step": 20912 }, { "epoch": 0.57, "learning_rate": 8.192330139752359e-06, "loss": 1.2466, "step": 20913 }, { "epoch": 0.57, "learning_rate": 8.191460211044778e-06, "loss": 1.3091, "step": 20914 }, { "epoch": 0.57, "learning_rate": 8.19059029648636e-06, "loss": 1.2937, "step": 20915 }, { "epoch": 0.57, "learning_rate": 8.189720396083916e-06, "loss": 1.3044, "step": 20916 }, { "epoch": 0.57, "learning_rate": 8.188850509844246e-06, "loss": 1.4478, "step": 20917 }, { "epoch": 0.57, "learning_rate": 8.18798063777416e-06, "loss": 1.1694, "step": 20918 }, { "epoch": 0.57, "learning_rate": 8.187110779880457e-06, "loss": 1.373, "step": 20919 }, { "epoch": 0.57, "learning_rate": 8.186240936169952e-06, "loss": 1.1735, "step": 20920 }, { "epoch": 0.57, "learning_rate": 8.185371106649441e-06, "loss": 1.2405, "step": 20921 }, { "epoch": 0.57, "learning_rate": 8.184501291325734e-06, "loss": 1.4341, "step": 20922 }, { "epoch": 0.57, "learning_rate": 8.183631490205636e-06, "loss": 1.2419, "step": 20923 }, { "epoch": 0.57, "learning_rate": 8.182761703295951e-06, "loss": 1.2256, "step": 20924 }, { "epoch": 0.57, "learning_rate": 8.181891930603485e-06, "loss": 1.3054, "step": 20925 }, { "epoch": 0.57, "learning_rate": 8.18102217213504e-06, "loss": 1.2454, "step": 20926 }, { "epoch": 0.57, "learning_rate": 8.180152427897425e-06, "loss": 1.2483, "step": 20927 }, { "epoch": 0.57, "learning_rate": 8.179282697897437e-06, "loss": 1.3977, "step": 20928 }, { "epoch": 0.57, "learning_rate": 8.17841298214189e-06, "loss": 1.1646, "step": 20929 }, { "epoch": 0.57, "learning_rate": 8.177543280637579e-06, "loss": 1.2544, "step": 20930 }, { "epoch": 0.57, "learning_rate": 8.176673593391315e-06, "loss": 1.1189, "step": 20931 }, { "epoch": 0.57, "learning_rate": 8.175803920409897e-06, "loss": 1.3223, "step": 20932 }, { "epoch": 0.57, "learning_rate": 8.174934261700135e-06, "loss": 1.2622, "step": 20933 }, { "epoch": 0.57, "learning_rate": 8.174064617268825e-06, "loss": 1.301, "step": 20934 }, { "epoch": 0.57, "learning_rate": 8.17319498712278e-06, "loss": 1.7866, "step": 20935 }, { "epoch": 0.57, "learning_rate": 8.172325371268793e-06, "loss": 1.1121, "step": 20936 }, { "epoch": 0.57, "learning_rate": 8.171455769713672e-06, "loss": 1.3206, "step": 20937 }, { "epoch": 0.57, "learning_rate": 8.170586182464227e-06, "loss": 1.4546, "step": 20938 }, { "epoch": 0.57, "learning_rate": 8.16971660952725e-06, "loss": 1.2388, "step": 20939 }, { "epoch": 0.57, "learning_rate": 8.168847050909556e-06, "loss": 1.2976, "step": 20940 }, { "epoch": 0.57, "learning_rate": 8.167977506617935e-06, "loss": 1.374, "step": 20941 }, { "epoch": 0.57, "learning_rate": 8.167107976659203e-06, "loss": 1.3584, "step": 20942 }, { "epoch": 0.57, "learning_rate": 8.166238461040147e-06, "loss": 1.2834, "step": 20943 }, { "epoch": 0.57, "learning_rate": 8.16536895976759e-06, "loss": 1.2095, "step": 20944 }, { "epoch": 0.57, "learning_rate": 8.164499472848315e-06, "loss": 1.2163, "step": 20945 }, { "epoch": 0.57, "learning_rate": 8.16363000028914e-06, "loss": 1.2405, "step": 20946 }, { "epoch": 0.57, "learning_rate": 8.162760542096853e-06, "loss": 1.2168, "step": 20947 }, { "epoch": 0.57, "learning_rate": 8.161891098278271e-06, "loss": 1.343, "step": 20948 }, { "epoch": 0.57, "learning_rate": 8.161021668840181e-06, "loss": 1.2551, "step": 20949 }, { "epoch": 0.57, "learning_rate": 8.1601522537894e-06, "loss": 1.218, "step": 20950 }, { "epoch": 0.57, "learning_rate": 8.159282853132717e-06, "loss": 1.3447, "step": 20951 }, { "epoch": 0.57, "learning_rate": 8.15841346687694e-06, "loss": 1.2388, "step": 20952 }, { "epoch": 0.57, "learning_rate": 8.157544095028873e-06, "loss": 1.3762, "step": 20953 }, { "epoch": 0.57, "learning_rate": 8.156674737595313e-06, "loss": 1.2556, "step": 20954 }, { "epoch": 0.57, "learning_rate": 8.155805394583064e-06, "loss": 1.1353, "step": 20955 }, { "epoch": 0.57, "learning_rate": 8.154936065998924e-06, "loss": 1.1331, "step": 20956 }, { "epoch": 0.57, "learning_rate": 8.154066751849701e-06, "loss": 1.4546, "step": 20957 }, { "epoch": 0.57, "learning_rate": 8.153197452142188e-06, "loss": 1.4265, "step": 20958 }, { "epoch": 0.57, "learning_rate": 8.152328166883192e-06, "loss": 1.218, "step": 20959 }, { "epoch": 0.57, "learning_rate": 8.151458896079509e-06, "loss": 1.2656, "step": 20960 }, { "epoch": 0.57, "learning_rate": 8.150589639737945e-06, "loss": 1.1638, "step": 20961 }, { "epoch": 0.57, "learning_rate": 8.149720397865294e-06, "loss": 1.4373, "step": 20962 }, { "epoch": 0.57, "learning_rate": 8.148851170468366e-06, "loss": 1.2366, "step": 20963 }, { "epoch": 0.57, "learning_rate": 8.147981957553952e-06, "loss": 1.2454, "step": 20964 }, { "epoch": 0.57, "learning_rate": 8.147112759128859e-06, "loss": 1.2974, "step": 20965 }, { "epoch": 0.57, "learning_rate": 8.146243575199882e-06, "loss": 1.3994, "step": 20966 }, { "epoch": 0.57, "learning_rate": 8.145374405773826e-06, "loss": 1.2173, "step": 20967 }, { "epoch": 0.57, "learning_rate": 8.144505250857486e-06, "loss": 1.1682, "step": 20968 }, { "epoch": 0.57, "learning_rate": 8.143636110457665e-06, "loss": 1.2698, "step": 20969 }, { "epoch": 0.57, "learning_rate": 8.142766984581164e-06, "loss": 1.3003, "step": 20970 }, { "epoch": 0.57, "learning_rate": 8.141897873234777e-06, "loss": 1.2439, "step": 20971 }, { "epoch": 0.57, "learning_rate": 8.141028776425311e-06, "loss": 1.2197, "step": 20972 }, { "epoch": 0.57, "learning_rate": 8.14015969415956e-06, "loss": 1.2881, "step": 20973 }, { "epoch": 0.57, "learning_rate": 8.139290626444327e-06, "loss": 1.269, "step": 20974 }, { "epoch": 0.57, "learning_rate": 8.138421573286407e-06, "loss": 1.4219, "step": 20975 }, { "epoch": 0.57, "learning_rate": 8.137552534692603e-06, "loss": 1.1263, "step": 20976 }, { "epoch": 0.57, "learning_rate": 8.13668351066971e-06, "loss": 1.4758, "step": 20977 }, { "epoch": 0.57, "learning_rate": 8.13581450122453e-06, "loss": 1.0618, "step": 20978 }, { "epoch": 0.57, "learning_rate": 8.13494550636386e-06, "loss": 1.2324, "step": 20979 }, { "epoch": 0.57, "learning_rate": 8.134076526094501e-06, "loss": 1.2214, "step": 20980 }, { "epoch": 0.57, "learning_rate": 8.133207560423249e-06, "loss": 1.8203, "step": 20981 }, { "epoch": 0.57, "learning_rate": 8.132338609356904e-06, "loss": 1.3052, "step": 20982 }, { "epoch": 0.57, "learning_rate": 8.131469672902262e-06, "loss": 1.3835, "step": 20983 }, { "epoch": 0.57, "learning_rate": 8.13060075106612e-06, "loss": 1.1628, "step": 20984 }, { "epoch": 0.57, "learning_rate": 8.129731843855287e-06, "loss": 1.3323, "step": 20985 }, { "epoch": 0.57, "learning_rate": 8.128862951276544e-06, "loss": 1.1506, "step": 20986 }, { "epoch": 0.57, "learning_rate": 8.127994073336703e-06, "loss": 1.2183, "step": 20987 }, { "epoch": 0.57, "learning_rate": 8.127125210042552e-06, "loss": 1.3032, "step": 20988 }, { "epoch": 0.57, "learning_rate": 8.126256361400898e-06, "loss": 1.2148, "step": 20989 }, { "epoch": 0.57, "learning_rate": 8.125387527418527e-06, "loss": 1.3853, "step": 20990 }, { "epoch": 0.57, "learning_rate": 8.124518708102248e-06, "loss": 1.3364, "step": 20991 }, { "epoch": 0.57, "learning_rate": 8.123649903458849e-06, "loss": 1.2847, "step": 20992 }, { "epoch": 0.57, "learning_rate": 8.122781113495135e-06, "loss": 1.2537, "step": 20993 }, { "epoch": 0.57, "learning_rate": 8.121912338217891e-06, "loss": 1.1349, "step": 20994 }, { "epoch": 0.57, "learning_rate": 8.12104357763393e-06, "loss": 1.7178, "step": 20995 }, { "epoch": 0.57, "learning_rate": 8.120174831750035e-06, "loss": 1.2185, "step": 20996 }, { "epoch": 0.57, "learning_rate": 8.119306100573013e-06, "loss": 1.3774, "step": 20997 }, { "epoch": 0.57, "learning_rate": 8.11843738410965e-06, "loss": 1.3979, "step": 20998 }, { "epoch": 0.57, "learning_rate": 8.117568682366748e-06, "loss": 1.2676, "step": 20999 }, { "epoch": 0.57, "learning_rate": 8.11669999535111e-06, "loss": 1.3562, "step": 21000 }, { "epoch": 0.57, "learning_rate": 8.115831323069519e-06, "loss": 1.2051, "step": 21001 }, { "epoch": 0.57, "learning_rate": 8.114962665528783e-06, "loss": 1.2769, "step": 21002 }, { "epoch": 0.57, "learning_rate": 8.114094022735688e-06, "loss": 1.2832, "step": 21003 }, { "epoch": 0.57, "learning_rate": 8.11322539469704e-06, "loss": 1.1775, "step": 21004 }, { "epoch": 0.57, "learning_rate": 8.112356781419625e-06, "loss": 1.3545, "step": 21005 }, { "epoch": 0.57, "learning_rate": 8.111488182910245e-06, "loss": 1.2139, "step": 21006 }, { "epoch": 0.57, "learning_rate": 8.110619599175693e-06, "loss": 1.1833, "step": 21007 }, { "epoch": 0.57, "learning_rate": 8.109751030222765e-06, "loss": 1.3218, "step": 21008 }, { "epoch": 0.57, "learning_rate": 8.108882476058255e-06, "loss": 1.6904, "step": 21009 }, { "epoch": 0.57, "learning_rate": 8.10801393668896e-06, "loss": 1.228, "step": 21010 }, { "epoch": 0.57, "learning_rate": 8.107145412121674e-06, "loss": 1.2932, "step": 21011 }, { "epoch": 0.57, "learning_rate": 8.106276902363193e-06, "loss": 1.2183, "step": 21012 }, { "epoch": 0.57, "learning_rate": 8.10540840742031e-06, "loss": 1.2852, "step": 21013 }, { "epoch": 0.57, "learning_rate": 8.104539927299819e-06, "loss": 1.0574, "step": 21014 }, { "epoch": 0.57, "learning_rate": 8.10367146200852e-06, "loss": 1.2527, "step": 21015 }, { "epoch": 0.57, "learning_rate": 8.1028030115532e-06, "loss": 1.2192, "step": 21016 }, { "epoch": 0.57, "learning_rate": 8.101934575940661e-06, "loss": 1.3542, "step": 21017 }, { "epoch": 0.57, "learning_rate": 8.101066155177691e-06, "loss": 1.376, "step": 21018 }, { "epoch": 0.57, "learning_rate": 8.100197749271089e-06, "loss": 1.3025, "step": 21019 }, { "epoch": 0.57, "learning_rate": 8.099329358227643e-06, "loss": 1.3115, "step": 21020 }, { "epoch": 0.57, "learning_rate": 8.098460982054152e-06, "loss": 1.2926, "step": 21021 }, { "epoch": 0.57, "learning_rate": 8.097592620757408e-06, "loss": 1.0764, "step": 21022 }, { "epoch": 0.57, "learning_rate": 8.096724274344206e-06, "loss": 1.3364, "step": 21023 }, { "epoch": 0.57, "learning_rate": 8.095855942821335e-06, "loss": 1.2711, "step": 21024 }, { "epoch": 0.57, "learning_rate": 8.094987626195595e-06, "loss": 1.1797, "step": 21025 }, { "epoch": 0.57, "learning_rate": 8.094119324473775e-06, "loss": 1.229, "step": 21026 }, { "epoch": 0.57, "learning_rate": 8.09325103766267e-06, "loss": 1.2244, "step": 21027 }, { "epoch": 0.57, "learning_rate": 8.09238276576907e-06, "loss": 1.3237, "step": 21028 }, { "epoch": 0.57, "learning_rate": 8.091514508799773e-06, "loss": 1.2673, "step": 21029 }, { "epoch": 0.57, "learning_rate": 8.090646266761566e-06, "loss": 1.2039, "step": 21030 }, { "epoch": 0.57, "learning_rate": 8.089778039661242e-06, "loss": 1.3032, "step": 21031 }, { "epoch": 0.57, "learning_rate": 8.088909827505605e-06, "loss": 1.6685, "step": 21032 }, { "epoch": 0.57, "learning_rate": 8.088041630301431e-06, "loss": 1.1707, "step": 21033 }, { "epoch": 0.57, "learning_rate": 8.087173448055527e-06, "loss": 1.2944, "step": 21034 }, { "epoch": 0.57, "learning_rate": 8.086305280774672e-06, "loss": 1.2441, "step": 21035 }, { "epoch": 0.57, "learning_rate": 8.085437128465672e-06, "loss": 1.2213, "step": 21036 }, { "epoch": 0.57, "learning_rate": 8.084568991135305e-06, "loss": 1.3511, "step": 21037 }, { "epoch": 0.57, "learning_rate": 8.083700868790374e-06, "loss": 1.2908, "step": 21038 }, { "epoch": 0.57, "learning_rate": 8.082832761437662e-06, "loss": 1.4824, "step": 21039 }, { "epoch": 0.57, "learning_rate": 8.08196466908397e-06, "loss": 1.219, "step": 21040 }, { "epoch": 0.57, "learning_rate": 8.081096591736077e-06, "loss": 1.2207, "step": 21041 }, { "epoch": 0.57, "learning_rate": 8.08022852940079e-06, "loss": 1.1692, "step": 21042 }, { "epoch": 0.57, "learning_rate": 8.079360482084885e-06, "loss": 1.2927, "step": 21043 }, { "epoch": 0.57, "learning_rate": 8.078492449795168e-06, "loss": 1.2561, "step": 21044 }, { "epoch": 0.57, "learning_rate": 8.077624432538417e-06, "loss": 1.249, "step": 21045 }, { "epoch": 0.57, "learning_rate": 8.076756430321428e-06, "loss": 1.2214, "step": 21046 }, { "epoch": 0.57, "learning_rate": 8.075888443150996e-06, "loss": 1.1816, "step": 21047 }, { "epoch": 0.57, "learning_rate": 8.075020471033907e-06, "loss": 1.3079, "step": 21048 }, { "epoch": 0.57, "learning_rate": 8.074152513976953e-06, "loss": 1.2942, "step": 21049 }, { "epoch": 0.57, "learning_rate": 8.073284571986922e-06, "loss": 1.2979, "step": 21050 }, { "epoch": 0.57, "learning_rate": 8.072416645070609e-06, "loss": 1.1472, "step": 21051 }, { "epoch": 0.57, "learning_rate": 8.0715487332348e-06, "loss": 1.2444, "step": 21052 }, { "epoch": 0.57, "learning_rate": 8.070680836486288e-06, "loss": 1.3245, "step": 21053 }, { "epoch": 0.57, "learning_rate": 8.06981295483186e-06, "loss": 1.2034, "step": 21054 }, { "epoch": 0.57, "learning_rate": 8.068945088278312e-06, "loss": 1.3, "step": 21055 }, { "epoch": 0.58, "learning_rate": 8.068077236832425e-06, "loss": 1.2981, "step": 21056 }, { "epoch": 0.58, "learning_rate": 8.067209400500995e-06, "loss": 1.2922, "step": 21057 }, { "epoch": 0.58, "learning_rate": 8.066341579290811e-06, "loss": 1.3188, "step": 21058 }, { "epoch": 0.58, "learning_rate": 8.065473773208661e-06, "loss": 1.2527, "step": 21059 }, { "epoch": 0.58, "learning_rate": 8.064605982261331e-06, "loss": 1.3569, "step": 21060 }, { "epoch": 0.58, "learning_rate": 8.063738206455615e-06, "loss": 1.1743, "step": 21061 }, { "epoch": 0.58, "learning_rate": 8.062870445798304e-06, "loss": 1.2612, "step": 21062 }, { "epoch": 0.58, "learning_rate": 8.06200270029618e-06, "loss": 1.2908, "step": 21063 }, { "epoch": 0.58, "learning_rate": 8.06113496995604e-06, "loss": 1.157, "step": 21064 }, { "epoch": 0.58, "learning_rate": 8.060267254784666e-06, "loss": 1.7451, "step": 21065 }, { "epoch": 0.58, "learning_rate": 8.059399554788849e-06, "loss": 1.3, "step": 21066 }, { "epoch": 0.58, "learning_rate": 8.058531869975376e-06, "loss": 1.3408, "step": 21067 }, { "epoch": 0.58, "learning_rate": 8.057664200351038e-06, "loss": 1.2585, "step": 21068 }, { "epoch": 0.58, "learning_rate": 8.05679654592262e-06, "loss": 1.4238, "step": 21069 }, { "epoch": 0.58, "learning_rate": 8.055928906696915e-06, "loss": 1.3364, "step": 21070 }, { "epoch": 0.58, "learning_rate": 8.055061282680705e-06, "loss": 1.2231, "step": 21071 }, { "epoch": 0.58, "learning_rate": 8.054193673880784e-06, "loss": 1.2581, "step": 21072 }, { "epoch": 0.58, "learning_rate": 8.053326080303935e-06, "loss": 1.2722, "step": 21073 }, { "epoch": 0.58, "learning_rate": 8.052458501956949e-06, "loss": 1.293, "step": 21074 }, { "epoch": 0.58, "learning_rate": 8.05159093884661e-06, "loss": 1.269, "step": 21075 }, { "epoch": 0.58, "learning_rate": 8.050723390979704e-06, "loss": 1.23, "step": 21076 }, { "epoch": 0.58, "learning_rate": 8.049855858363029e-06, "loss": 1.4043, "step": 21077 }, { "epoch": 0.58, "learning_rate": 8.048988341003358e-06, "loss": 1.3318, "step": 21078 }, { "epoch": 0.58, "learning_rate": 8.048120838907492e-06, "loss": 1.2717, "step": 21079 }, { "epoch": 0.58, "learning_rate": 8.047253352082202e-06, "loss": 1.7305, "step": 21080 }, { "epoch": 0.58, "learning_rate": 8.046385880534292e-06, "loss": 1.376, "step": 21081 }, { "epoch": 0.58, "learning_rate": 8.045518424270533e-06, "loss": 1.3198, "step": 21082 }, { "epoch": 0.58, "learning_rate": 8.044650983297725e-06, "loss": 1.2656, "step": 21083 }, { "epoch": 0.58, "learning_rate": 8.043783557622642e-06, "loss": 1.2583, "step": 21084 }, { "epoch": 0.58, "learning_rate": 8.042916147252085e-06, "loss": 1.2969, "step": 21085 }, { "epoch": 0.58, "learning_rate": 8.042048752192823e-06, "loss": 1.241, "step": 21086 }, { "epoch": 0.58, "learning_rate": 8.041181372451656e-06, "loss": 1.1743, "step": 21087 }, { "epoch": 0.58, "learning_rate": 8.040314008035363e-06, "loss": 1.2983, "step": 21088 }, { "epoch": 0.58, "learning_rate": 8.039446658950734e-06, "loss": 1.1816, "step": 21089 }, { "epoch": 0.58, "learning_rate": 8.038579325204548e-06, "loss": 1.3052, "step": 21090 }, { "epoch": 0.58, "learning_rate": 8.0377120068036e-06, "loss": 1.2808, "step": 21091 }, { "epoch": 0.58, "learning_rate": 8.036844703754667e-06, "loss": 1.3298, "step": 21092 }, { "epoch": 0.58, "learning_rate": 8.035977416064538e-06, "loss": 1.3254, "step": 21093 }, { "epoch": 0.58, "learning_rate": 8.03511014374e-06, "loss": 1.3374, "step": 21094 }, { "epoch": 0.58, "learning_rate": 8.034242886787836e-06, "loss": 1.4272, "step": 21095 }, { "epoch": 0.58, "learning_rate": 8.03337564521483e-06, "loss": 1.2698, "step": 21096 }, { "epoch": 0.58, "learning_rate": 8.03250841902777e-06, "loss": 1.1555, "step": 21097 }, { "epoch": 0.58, "learning_rate": 8.031641208233438e-06, "loss": 1.1729, "step": 21098 }, { "epoch": 0.58, "learning_rate": 8.030774012838617e-06, "loss": 1.4824, "step": 21099 }, { "epoch": 0.58, "learning_rate": 8.029906832850098e-06, "loss": 1.4224, "step": 21100 }, { "epoch": 0.58, "learning_rate": 8.02903966827466e-06, "loss": 1.7231, "step": 21101 }, { "epoch": 0.58, "learning_rate": 8.02817251911909e-06, "loss": 1.2422, "step": 21102 }, { "epoch": 0.58, "learning_rate": 8.02730538539017e-06, "loss": 1.2485, "step": 21103 }, { "epoch": 0.58, "learning_rate": 8.026438267094685e-06, "loss": 1.1368, "step": 21104 }, { "epoch": 0.58, "learning_rate": 8.025571164239418e-06, "loss": 1.2585, "step": 21105 }, { "epoch": 0.58, "learning_rate": 8.024704076831157e-06, "loss": 1.2913, "step": 21106 }, { "epoch": 0.58, "learning_rate": 8.02383700487668e-06, "loss": 1.3262, "step": 21107 }, { "epoch": 0.58, "learning_rate": 8.02296994838277e-06, "loss": 1.4775, "step": 21108 }, { "epoch": 0.58, "learning_rate": 8.02210290735622e-06, "loss": 1.3093, "step": 21109 }, { "epoch": 0.58, "learning_rate": 8.021235881803802e-06, "loss": 1.2896, "step": 21110 }, { "epoch": 0.58, "learning_rate": 8.020368871732305e-06, "loss": 1.3191, "step": 21111 }, { "epoch": 0.58, "learning_rate": 8.019501877148512e-06, "loss": 1.3386, "step": 21112 }, { "epoch": 0.58, "learning_rate": 8.018634898059206e-06, "loss": 1.4116, "step": 21113 }, { "epoch": 0.58, "learning_rate": 8.017767934471165e-06, "loss": 1.1707, "step": 21114 }, { "epoch": 0.58, "learning_rate": 8.01690098639118e-06, "loss": 1.2473, "step": 21115 }, { "epoch": 0.58, "learning_rate": 8.016034053826025e-06, "loss": 1.3088, "step": 21116 }, { "epoch": 0.58, "learning_rate": 8.015167136782491e-06, "loss": 1.407, "step": 21117 }, { "epoch": 0.58, "learning_rate": 8.014300235267352e-06, "loss": 1.3792, "step": 21118 }, { "epoch": 0.58, "learning_rate": 8.013433349287399e-06, "loss": 1.2891, "step": 21119 }, { "epoch": 0.58, "learning_rate": 8.012566478849401e-06, "loss": 1.3306, "step": 21120 }, { "epoch": 0.58, "learning_rate": 8.011699623960157e-06, "loss": 1.2827, "step": 21121 }, { "epoch": 0.58, "learning_rate": 8.010832784626435e-06, "loss": 1.344, "step": 21122 }, { "epoch": 0.58, "learning_rate": 8.009965960855021e-06, "loss": 1.167, "step": 21123 }, { "epoch": 0.58, "learning_rate": 8.009099152652703e-06, "loss": 1.27, "step": 21124 }, { "epoch": 0.58, "learning_rate": 8.008232360026253e-06, "loss": 1.3162, "step": 21125 }, { "epoch": 0.58, "learning_rate": 8.007365582982459e-06, "loss": 1.2849, "step": 21126 }, { "epoch": 0.58, "learning_rate": 8.006498821528097e-06, "loss": 1.3765, "step": 21127 }, { "epoch": 0.58, "learning_rate": 8.005632075669954e-06, "loss": 1.0911, "step": 21128 }, { "epoch": 0.58, "learning_rate": 8.004765345414804e-06, "loss": 1.2637, "step": 21129 }, { "epoch": 0.58, "learning_rate": 8.003898630769436e-06, "loss": 1.335, "step": 21130 }, { "epoch": 0.58, "learning_rate": 8.003031931740622e-06, "loss": 1.2761, "step": 21131 }, { "epoch": 0.58, "learning_rate": 8.002165248335151e-06, "loss": 1.3684, "step": 21132 }, { "epoch": 0.58, "learning_rate": 8.001298580559798e-06, "loss": 1.3064, "step": 21133 }, { "epoch": 0.58, "learning_rate": 8.000431928421345e-06, "loss": 1.2297, "step": 21134 }, { "epoch": 0.58, "learning_rate": 7.999565291926573e-06, "loss": 1.2141, "step": 21135 }, { "epoch": 0.58, "learning_rate": 7.99869867108226e-06, "loss": 1.3152, "step": 21136 }, { "epoch": 0.58, "learning_rate": 7.997832065895188e-06, "loss": 1.1493, "step": 21137 }, { "epoch": 0.58, "learning_rate": 7.996965476372137e-06, "loss": 1.3657, "step": 21138 }, { "epoch": 0.58, "learning_rate": 7.996098902519886e-06, "loss": 1.1804, "step": 21139 }, { "epoch": 0.58, "learning_rate": 7.995232344345214e-06, "loss": 1.3147, "step": 21140 }, { "epoch": 0.58, "learning_rate": 7.994365801854904e-06, "loss": 1.4167, "step": 21141 }, { "epoch": 0.58, "learning_rate": 7.99349927505573e-06, "loss": 1.2593, "step": 21142 }, { "epoch": 0.58, "learning_rate": 7.992632763954476e-06, "loss": 1.3782, "step": 21143 }, { "epoch": 0.58, "learning_rate": 7.991766268557917e-06, "loss": 1.3955, "step": 21144 }, { "epoch": 0.58, "learning_rate": 7.990899788872838e-06, "loss": 1.366, "step": 21145 }, { "epoch": 0.58, "learning_rate": 7.990033324906011e-06, "loss": 1.3708, "step": 21146 }, { "epoch": 0.58, "learning_rate": 7.98916687666422e-06, "loss": 1.312, "step": 21147 }, { "epoch": 0.58, "learning_rate": 7.988300444154241e-06, "loss": 1.3511, "step": 21148 }, { "epoch": 0.58, "learning_rate": 7.987434027382856e-06, "loss": 1.3335, "step": 21149 }, { "epoch": 0.58, "learning_rate": 7.986567626356836e-06, "loss": 1.2458, "step": 21150 }, { "epoch": 0.58, "learning_rate": 7.985701241082968e-06, "loss": 1.2793, "step": 21151 }, { "epoch": 0.58, "learning_rate": 7.984834871568024e-06, "loss": 1.3403, "step": 21152 }, { "epoch": 0.58, "learning_rate": 7.983968517818787e-06, "loss": 1.1316, "step": 21153 }, { "epoch": 0.58, "learning_rate": 7.983102179842029e-06, "loss": 1.2771, "step": 21154 }, { "epoch": 0.58, "learning_rate": 7.982235857644529e-06, "loss": 1.7925, "step": 21155 }, { "epoch": 0.58, "learning_rate": 7.981369551233074e-06, "loss": 1.1414, "step": 21156 }, { "epoch": 0.58, "learning_rate": 7.980503260614427e-06, "loss": 1.283, "step": 21157 }, { "epoch": 0.58, "learning_rate": 7.97963698579538e-06, "loss": 1.2244, "step": 21158 }, { "epoch": 0.58, "learning_rate": 7.978770726782697e-06, "loss": 1.2202, "step": 21159 }, { "epoch": 0.58, "learning_rate": 7.97790448358317e-06, "loss": 1.134, "step": 21160 }, { "epoch": 0.58, "learning_rate": 7.977038256203557e-06, "loss": 1.7505, "step": 21161 }, { "epoch": 0.58, "learning_rate": 7.976172044650654e-06, "loss": 1.2516, "step": 21162 }, { "epoch": 0.58, "learning_rate": 7.975305848931223e-06, "loss": 1.2544, "step": 21163 }, { "epoch": 0.58, "learning_rate": 7.974439669052053e-06, "loss": 1.3413, "step": 21164 }, { "epoch": 0.58, "learning_rate": 7.973573505019905e-06, "loss": 1.3142, "step": 21165 }, { "epoch": 0.58, "learning_rate": 7.972707356841575e-06, "loss": 1.1792, "step": 21166 }, { "epoch": 0.58, "learning_rate": 7.971841224523822e-06, "loss": 1.2339, "step": 21167 }, { "epoch": 0.58, "learning_rate": 7.970975108073437e-06, "loss": 1.2402, "step": 21168 }, { "epoch": 0.58, "learning_rate": 7.970109007497182e-06, "loss": 1.2612, "step": 21169 }, { "epoch": 0.58, "learning_rate": 7.96924292280184e-06, "loss": 1.3447, "step": 21170 }, { "epoch": 0.58, "learning_rate": 7.96837685399419e-06, "loss": 1.2683, "step": 21171 }, { "epoch": 0.58, "learning_rate": 7.967510801081002e-06, "loss": 1.2964, "step": 21172 }, { "epoch": 0.58, "learning_rate": 7.966644764069055e-06, "loss": 1.2571, "step": 21173 }, { "epoch": 0.58, "learning_rate": 7.965778742965121e-06, "loss": 1.3179, "step": 21174 }, { "epoch": 0.58, "learning_rate": 7.96491273777598e-06, "loss": 1.249, "step": 21175 }, { "epoch": 0.58, "learning_rate": 7.964046748508404e-06, "loss": 1.2034, "step": 21176 }, { "epoch": 0.58, "learning_rate": 7.96318077516917e-06, "loss": 1.3682, "step": 21177 }, { "epoch": 0.58, "learning_rate": 7.96231481776505e-06, "loss": 1.2925, "step": 21178 }, { "epoch": 0.58, "learning_rate": 7.961448876302822e-06, "loss": 1.4087, "step": 21179 }, { "epoch": 0.58, "learning_rate": 7.960582950789258e-06, "loss": 1.3882, "step": 21180 }, { "epoch": 0.58, "learning_rate": 7.959717041231137e-06, "loss": 1.2966, "step": 21181 }, { "epoch": 0.58, "learning_rate": 7.958851147635226e-06, "loss": 1.1509, "step": 21182 }, { "epoch": 0.58, "learning_rate": 7.957985270008308e-06, "loss": 1.2466, "step": 21183 }, { "epoch": 0.58, "learning_rate": 7.95711940835715e-06, "loss": 1.2986, "step": 21184 }, { "epoch": 0.58, "learning_rate": 7.956253562688529e-06, "loss": 1.2378, "step": 21185 }, { "epoch": 0.58, "learning_rate": 7.95538773300922e-06, "loss": 1.1462, "step": 21186 }, { "epoch": 0.58, "learning_rate": 7.954521919325995e-06, "loss": 1.2415, "step": 21187 }, { "epoch": 0.58, "learning_rate": 7.953656121645632e-06, "loss": 1.2046, "step": 21188 }, { "epoch": 0.58, "learning_rate": 7.952790339974899e-06, "loss": 1.3269, "step": 21189 }, { "epoch": 0.58, "learning_rate": 7.951924574320573e-06, "loss": 1.3174, "step": 21190 }, { "epoch": 0.58, "learning_rate": 7.951058824689424e-06, "loss": 1.2678, "step": 21191 }, { "epoch": 0.58, "learning_rate": 7.950193091088227e-06, "loss": 1.2888, "step": 21192 }, { "epoch": 0.58, "learning_rate": 7.949327373523756e-06, "loss": 1.1932, "step": 21193 }, { "epoch": 0.58, "learning_rate": 7.948461672002786e-06, "loss": 1.2241, "step": 21194 }, { "epoch": 0.58, "learning_rate": 7.947595986532084e-06, "loss": 1.4121, "step": 21195 }, { "epoch": 0.58, "learning_rate": 7.946730317118427e-06, "loss": 1.377, "step": 21196 }, { "epoch": 0.58, "learning_rate": 7.945864663768585e-06, "loss": 1.3477, "step": 21197 }, { "epoch": 0.58, "learning_rate": 7.944999026489336e-06, "loss": 1.1389, "step": 21198 }, { "epoch": 0.58, "learning_rate": 7.944133405287445e-06, "loss": 1.3059, "step": 21199 }, { "epoch": 0.58, "learning_rate": 7.943267800169688e-06, "loss": 1.0647, "step": 21200 }, { "epoch": 0.58, "learning_rate": 7.942402211142836e-06, "loss": 1.356, "step": 21201 }, { "epoch": 0.58, "learning_rate": 7.941536638213658e-06, "loss": 1.2871, "step": 21202 }, { "epoch": 0.58, "learning_rate": 7.940671081388937e-06, "loss": 1.3337, "step": 21203 }, { "epoch": 0.58, "learning_rate": 7.939805540675432e-06, "loss": 1.3401, "step": 21204 }, { "epoch": 0.58, "learning_rate": 7.938940016079925e-06, "loss": 1.2849, "step": 21205 }, { "epoch": 0.58, "learning_rate": 7.938074507609174e-06, "loss": 1.4062, "step": 21206 }, { "epoch": 0.58, "learning_rate": 7.937209015269967e-06, "loss": 1.2722, "step": 21207 }, { "epoch": 0.58, "learning_rate": 7.936343539069059e-06, "loss": 1.4858, "step": 21208 }, { "epoch": 0.58, "learning_rate": 7.935478079013236e-06, "loss": 1.3564, "step": 21209 }, { "epoch": 0.58, "learning_rate": 7.934612635109256e-06, "loss": 1.2605, "step": 21210 }, { "epoch": 0.58, "learning_rate": 7.9337472073639e-06, "loss": 1.2201, "step": 21211 }, { "epoch": 0.58, "learning_rate": 7.932881795783928e-06, "loss": 1.7139, "step": 21212 }, { "epoch": 0.58, "learning_rate": 7.932016400376125e-06, "loss": 1.072, "step": 21213 }, { "epoch": 0.58, "learning_rate": 7.931151021147245e-06, "loss": 1.2974, "step": 21214 }, { "epoch": 0.58, "learning_rate": 7.930285658104074e-06, "loss": 1.0146, "step": 21215 }, { "epoch": 0.58, "learning_rate": 7.929420311253368e-06, "loss": 1.3652, "step": 21216 }, { "epoch": 0.58, "learning_rate": 7.928554980601906e-06, "loss": 1.4756, "step": 21217 }, { "epoch": 0.58, "learning_rate": 7.927689666156458e-06, "loss": 1.365, "step": 21218 }, { "epoch": 0.58, "learning_rate": 7.92682436792379e-06, "loss": 1.3232, "step": 21219 }, { "epoch": 0.58, "learning_rate": 7.925959085910675e-06, "loss": 1.1882, "step": 21220 }, { "epoch": 0.58, "learning_rate": 7.92509382012388e-06, "loss": 1.3586, "step": 21221 }, { "epoch": 0.58, "learning_rate": 7.924228570570175e-06, "loss": 1.3486, "step": 21222 }, { "epoch": 0.58, "learning_rate": 7.923363337256327e-06, "loss": 1.3608, "step": 21223 }, { "epoch": 0.58, "learning_rate": 7.922498120189112e-06, "loss": 1.3357, "step": 21224 }, { "epoch": 0.58, "learning_rate": 7.921632919375293e-06, "loss": 1.2881, "step": 21225 }, { "epoch": 0.58, "learning_rate": 7.920767734821641e-06, "loss": 1.252, "step": 21226 }, { "epoch": 0.58, "learning_rate": 7.919902566534923e-06, "loss": 1.3523, "step": 21227 }, { "epoch": 0.58, "learning_rate": 7.919037414521912e-06, "loss": 1.3479, "step": 21228 }, { "epoch": 0.58, "learning_rate": 7.918172278789371e-06, "loss": 1.2288, "step": 21229 }, { "epoch": 0.58, "learning_rate": 7.917307159344074e-06, "loss": 1.3728, "step": 21230 }, { "epoch": 0.58, "learning_rate": 7.916442056192783e-06, "loss": 1.1814, "step": 21231 }, { "epoch": 0.58, "learning_rate": 7.91557696934227e-06, "loss": 1.3105, "step": 21232 }, { "epoch": 0.58, "learning_rate": 7.914711898799306e-06, "loss": 1.4629, "step": 21233 }, { "epoch": 0.58, "learning_rate": 7.913846844570652e-06, "loss": 1.3103, "step": 21234 }, { "epoch": 0.58, "learning_rate": 7.91298180666308e-06, "loss": 1.2517, "step": 21235 }, { "epoch": 0.58, "learning_rate": 7.912116785083358e-06, "loss": 1.7812, "step": 21236 }, { "epoch": 0.58, "learning_rate": 7.911251779838253e-06, "loss": 1.1411, "step": 21237 }, { "epoch": 0.58, "learning_rate": 7.91038679093453e-06, "loss": 1.2849, "step": 21238 }, { "epoch": 0.58, "learning_rate": 7.909521818378961e-06, "loss": 1.3894, "step": 21239 }, { "epoch": 0.58, "learning_rate": 7.908656862178307e-06, "loss": 1.313, "step": 21240 }, { "epoch": 0.58, "learning_rate": 7.907791922339343e-06, "loss": 1.3271, "step": 21241 }, { "epoch": 0.58, "learning_rate": 7.906926998868826e-06, "loss": 1.3269, "step": 21242 }, { "epoch": 0.58, "learning_rate": 7.90606209177353e-06, "loss": 1.3401, "step": 21243 }, { "epoch": 0.58, "learning_rate": 7.905197201060218e-06, "loss": 1.1608, "step": 21244 }, { "epoch": 0.58, "learning_rate": 7.904332326735662e-06, "loss": 1.2744, "step": 21245 }, { "epoch": 0.58, "learning_rate": 7.90346746880662e-06, "loss": 1.3296, "step": 21246 }, { "epoch": 0.58, "learning_rate": 7.902602627279861e-06, "loss": 1.3372, "step": 21247 }, { "epoch": 0.58, "learning_rate": 7.90173780216216e-06, "loss": 1.3364, "step": 21248 }, { "epoch": 0.58, "learning_rate": 7.900872993460269e-06, "loss": 1.2312, "step": 21249 }, { "epoch": 0.58, "learning_rate": 7.900008201180968e-06, "loss": 1.271, "step": 21250 }, { "epoch": 0.58, "learning_rate": 7.899143425331008e-06, "loss": 1.291, "step": 21251 }, { "epoch": 0.58, "learning_rate": 7.898278665917168e-06, "loss": 1.373, "step": 21252 }, { "epoch": 0.58, "learning_rate": 7.8974139229462e-06, "loss": 1.1697, "step": 21253 }, { "epoch": 0.58, "learning_rate": 7.896549196424886e-06, "loss": 1.3037, "step": 21254 }, { "epoch": 0.58, "learning_rate": 7.895684486359973e-06, "loss": 1.1523, "step": 21255 }, { "epoch": 0.58, "learning_rate": 7.894819792758244e-06, "loss": 1.262, "step": 21256 }, { "epoch": 0.58, "learning_rate": 7.893955115626446e-06, "loss": 1.2368, "step": 21257 }, { "epoch": 0.58, "learning_rate": 7.89309045497136e-06, "loss": 1.3252, "step": 21258 }, { "epoch": 0.58, "learning_rate": 7.892225810799738e-06, "loss": 1.1359, "step": 21259 }, { "epoch": 0.58, "learning_rate": 7.891361183118356e-06, "loss": 1.1279, "step": 21260 }, { "epoch": 0.58, "learning_rate": 7.890496571933967e-06, "loss": 1.3792, "step": 21261 }, { "epoch": 0.58, "learning_rate": 7.889631977253346e-06, "loss": 1.3386, "step": 21262 }, { "epoch": 0.58, "learning_rate": 7.888767399083245e-06, "loss": 1.2561, "step": 21263 }, { "epoch": 0.58, "learning_rate": 7.88790283743044e-06, "loss": 1.4028, "step": 21264 }, { "epoch": 0.58, "learning_rate": 7.88703829230169e-06, "loss": 1.2285, "step": 21265 }, { "epoch": 0.58, "learning_rate": 7.886173763703757e-06, "loss": 1.2961, "step": 21266 }, { "epoch": 0.58, "learning_rate": 7.885309251643409e-06, "loss": 1.2266, "step": 21267 }, { "epoch": 0.58, "learning_rate": 7.884444756127403e-06, "loss": 1.2739, "step": 21268 }, { "epoch": 0.58, "learning_rate": 7.883580277162511e-06, "loss": 1.2131, "step": 21269 }, { "epoch": 0.58, "learning_rate": 7.882715814755489e-06, "loss": 1.3054, "step": 21270 }, { "epoch": 0.58, "learning_rate": 7.881851368913105e-06, "loss": 1.3037, "step": 21271 }, { "epoch": 0.58, "learning_rate": 7.880986939642118e-06, "loss": 1.2324, "step": 21272 }, { "epoch": 0.58, "learning_rate": 7.880122526949294e-06, "loss": 1.3916, "step": 21273 }, { "epoch": 0.58, "learning_rate": 7.879258130841392e-06, "loss": 1.3162, "step": 21274 }, { "epoch": 0.58, "learning_rate": 7.87839375132518e-06, "loss": 1.2676, "step": 21275 }, { "epoch": 0.58, "learning_rate": 7.877529388407417e-06, "loss": 1.1602, "step": 21276 }, { "epoch": 0.58, "learning_rate": 7.876665042094867e-06, "loss": 1.3125, "step": 21277 }, { "epoch": 0.58, "learning_rate": 7.875800712394289e-06, "loss": 1.1772, "step": 21278 }, { "epoch": 0.58, "learning_rate": 7.874936399312446e-06, "loss": 1.2222, "step": 21279 }, { "epoch": 0.58, "learning_rate": 7.874072102856105e-06, "loss": 1.1914, "step": 21280 }, { "epoch": 0.58, "learning_rate": 7.873207823032022e-06, "loss": 1.3687, "step": 21281 }, { "epoch": 0.58, "learning_rate": 7.872343559846962e-06, "loss": 1.3818, "step": 21282 }, { "epoch": 0.58, "learning_rate": 7.871479313307684e-06, "loss": 1.0828, "step": 21283 }, { "epoch": 0.58, "learning_rate": 7.870615083420954e-06, "loss": 1.3486, "step": 21284 }, { "epoch": 0.58, "learning_rate": 7.869750870193527e-06, "loss": 1.2197, "step": 21285 }, { "epoch": 0.58, "learning_rate": 7.86888667363217e-06, "loss": 1.313, "step": 21286 }, { "epoch": 0.58, "learning_rate": 7.868022493743638e-06, "loss": 1.4424, "step": 21287 }, { "epoch": 0.58, "learning_rate": 7.8671583305347e-06, "loss": 1.2048, "step": 21288 }, { "epoch": 0.58, "learning_rate": 7.866294184012109e-06, "loss": 1.3318, "step": 21289 }, { "epoch": 0.58, "learning_rate": 7.86543005418263e-06, "loss": 1.2415, "step": 21290 }, { "epoch": 0.58, "learning_rate": 7.864565941053023e-06, "loss": 1.3459, "step": 21291 }, { "epoch": 0.58, "learning_rate": 7.863701844630049e-06, "loss": 1.1365, "step": 21292 }, { "epoch": 0.58, "learning_rate": 7.862837764920465e-06, "loss": 1.2007, "step": 21293 }, { "epoch": 0.58, "learning_rate": 7.861973701931031e-06, "loss": 1.291, "step": 21294 }, { "epoch": 0.58, "learning_rate": 7.861109655668516e-06, "loss": 1.3293, "step": 21295 }, { "epoch": 0.58, "learning_rate": 7.860245626139665e-06, "loss": 1.3354, "step": 21296 }, { "epoch": 0.58, "learning_rate": 7.859381613351254e-06, "loss": 1.2637, "step": 21297 }, { "epoch": 0.58, "learning_rate": 7.858517617310029e-06, "loss": 1.2847, "step": 21298 }, { "epoch": 0.58, "learning_rate": 7.85765363802276e-06, "loss": 1.1989, "step": 21299 }, { "epoch": 0.58, "learning_rate": 7.856789675496198e-06, "loss": 1.3389, "step": 21300 }, { "epoch": 0.58, "learning_rate": 7.855925729737108e-06, "loss": 1.2517, "step": 21301 }, { "epoch": 0.58, "learning_rate": 7.855061800752243e-06, "loss": 1.3074, "step": 21302 }, { "epoch": 0.58, "learning_rate": 7.854197888548373e-06, "loss": 1.6343, "step": 21303 }, { "epoch": 0.58, "learning_rate": 7.853333993132241e-06, "loss": 1.3916, "step": 21304 }, { "epoch": 0.58, "learning_rate": 7.852470114510622e-06, "loss": 1.2593, "step": 21305 }, { "epoch": 0.58, "learning_rate": 7.851606252690261e-06, "loss": 1.3198, "step": 21306 }, { "epoch": 0.58, "learning_rate": 7.850742407677929e-06, "loss": 1.1555, "step": 21307 }, { "epoch": 0.58, "learning_rate": 7.84987857948037e-06, "loss": 1.2654, "step": 21308 }, { "epoch": 0.58, "learning_rate": 7.849014768104354e-06, "loss": 1.3271, "step": 21309 }, { "epoch": 0.58, "learning_rate": 7.848150973556636e-06, "loss": 1.2742, "step": 21310 }, { "epoch": 0.58, "learning_rate": 7.84728719584397e-06, "loss": 1.3486, "step": 21311 }, { "epoch": 0.58, "learning_rate": 7.846423434973119e-06, "loss": 1.2207, "step": 21312 }, { "epoch": 0.58, "learning_rate": 7.845559690950838e-06, "loss": 1.2236, "step": 21313 }, { "epoch": 0.58, "learning_rate": 7.844695963783885e-06, "loss": 1.3655, "step": 21314 }, { "epoch": 0.58, "learning_rate": 7.843832253479016e-06, "loss": 1.1975, "step": 21315 }, { "epoch": 0.58, "learning_rate": 7.842968560042992e-06, "loss": 1.3999, "step": 21316 }, { "epoch": 0.58, "learning_rate": 7.842104883482566e-06, "loss": 1.2847, "step": 21317 }, { "epoch": 0.58, "learning_rate": 7.841241223804498e-06, "loss": 1.228, "step": 21318 }, { "epoch": 0.58, "learning_rate": 7.84037758101554e-06, "loss": 1.126, "step": 21319 }, { "epoch": 0.58, "learning_rate": 7.839513955122456e-06, "loss": 1.1703, "step": 21320 }, { "epoch": 0.58, "learning_rate": 7.838650346131997e-06, "loss": 1.3774, "step": 21321 }, { "epoch": 0.58, "learning_rate": 7.837786754050923e-06, "loss": 1.2581, "step": 21322 }, { "epoch": 0.58, "learning_rate": 7.836923178885987e-06, "loss": 1.4595, "step": 21323 }, { "epoch": 0.58, "learning_rate": 7.836059620643948e-06, "loss": 1.1647, "step": 21324 }, { "epoch": 0.58, "learning_rate": 7.835196079331559e-06, "loss": 1.3669, "step": 21325 }, { "epoch": 0.58, "learning_rate": 7.83433255495558e-06, "loss": 1.3391, "step": 21326 }, { "epoch": 0.58, "learning_rate": 7.833469047522766e-06, "loss": 1.3164, "step": 21327 }, { "epoch": 0.58, "learning_rate": 7.832605557039868e-06, "loss": 1.3262, "step": 21328 }, { "epoch": 0.58, "learning_rate": 7.831742083513647e-06, "loss": 1.4265, "step": 21329 }, { "epoch": 0.58, "learning_rate": 7.830878626950855e-06, "loss": 1.0898, "step": 21330 }, { "epoch": 0.58, "learning_rate": 7.83001518735825e-06, "loss": 1.2332, "step": 21331 }, { "epoch": 0.58, "learning_rate": 7.829151764742586e-06, "loss": 1.397, "step": 21332 }, { "epoch": 0.58, "learning_rate": 7.828288359110617e-06, "loss": 1.2274, "step": 21333 }, { "epoch": 0.58, "learning_rate": 7.827424970469098e-06, "loss": 1.241, "step": 21334 }, { "epoch": 0.58, "learning_rate": 7.826561598824786e-06, "loss": 1.1553, "step": 21335 }, { "epoch": 0.58, "learning_rate": 7.825698244184432e-06, "loss": 1.3499, "step": 21336 }, { "epoch": 0.58, "learning_rate": 7.824834906554794e-06, "loss": 1.2749, "step": 21337 }, { "epoch": 0.58, "learning_rate": 7.823971585942625e-06, "loss": 1.3867, "step": 21338 }, { "epoch": 0.58, "learning_rate": 7.823108282354679e-06, "loss": 1.3108, "step": 21339 }, { "epoch": 0.58, "learning_rate": 7.82224499579771e-06, "loss": 1.4023, "step": 21340 }, { "epoch": 0.58, "learning_rate": 7.821381726278467e-06, "loss": 1.3713, "step": 21341 }, { "epoch": 0.58, "learning_rate": 7.820518473803717e-06, "loss": 1.2913, "step": 21342 }, { "epoch": 0.58, "learning_rate": 7.819655238380199e-06, "loss": 1.2715, "step": 21343 }, { "epoch": 0.58, "learning_rate": 7.81879202001468e-06, "loss": 1.2031, "step": 21344 }, { "epoch": 0.58, "learning_rate": 7.8179288187139e-06, "loss": 1.2715, "step": 21345 }, { "epoch": 0.58, "learning_rate": 7.817065634484626e-06, "loss": 1.2695, "step": 21346 }, { "epoch": 0.58, "learning_rate": 7.816202467333597e-06, "loss": 1.3066, "step": 21347 }, { "epoch": 0.58, "learning_rate": 7.815339317267579e-06, "loss": 1.1394, "step": 21348 }, { "epoch": 0.58, "learning_rate": 7.814476184293313e-06, "loss": 1.207, "step": 21349 }, { "epoch": 0.58, "learning_rate": 7.813613068417563e-06, "loss": 1.46, "step": 21350 }, { "epoch": 0.58, "learning_rate": 7.812749969647071e-06, "loss": 1.1807, "step": 21351 }, { "epoch": 0.58, "learning_rate": 7.811886887988599e-06, "loss": 1.3994, "step": 21352 }, { "epoch": 0.58, "learning_rate": 7.811023823448892e-06, "loss": 1.3093, "step": 21353 }, { "epoch": 0.58, "learning_rate": 7.810160776034707e-06, "loss": 1.3577, "step": 21354 }, { "epoch": 0.58, "learning_rate": 7.809297745752793e-06, "loss": 1.7759, "step": 21355 }, { "epoch": 0.58, "learning_rate": 7.808434732609903e-06, "loss": 1.2356, "step": 21356 }, { "epoch": 0.58, "learning_rate": 7.807571736612792e-06, "loss": 1.2834, "step": 21357 }, { "epoch": 0.58, "learning_rate": 7.806708757768207e-06, "loss": 1.4097, "step": 21358 }, { "epoch": 0.58, "learning_rate": 7.805845796082903e-06, "loss": 1.323, "step": 21359 }, { "epoch": 0.58, "learning_rate": 7.804982851563626e-06, "loss": 1.3125, "step": 21360 }, { "epoch": 0.58, "learning_rate": 7.804119924217135e-06, "loss": 1.2627, "step": 21361 }, { "epoch": 0.58, "learning_rate": 7.803257014050174e-06, "loss": 1.0703, "step": 21362 }, { "epoch": 0.58, "learning_rate": 7.8023941210695e-06, "loss": 1.249, "step": 21363 }, { "epoch": 0.58, "learning_rate": 7.801531245281859e-06, "loss": 1.3662, "step": 21364 }, { "epoch": 0.58, "learning_rate": 7.800668386694005e-06, "loss": 1.1624, "step": 21365 }, { "epoch": 0.58, "learning_rate": 7.799805545312686e-06, "loss": 1.1655, "step": 21366 }, { "epoch": 0.58, "learning_rate": 7.798942721144655e-06, "loss": 1.3203, "step": 21367 }, { "epoch": 0.58, "learning_rate": 7.79807991419666e-06, "loss": 1.3528, "step": 21368 }, { "epoch": 0.58, "learning_rate": 7.797217124475454e-06, "loss": 1.2971, "step": 21369 }, { "epoch": 0.58, "learning_rate": 7.796354351987783e-06, "loss": 1.4031, "step": 21370 }, { "epoch": 0.58, "learning_rate": 7.7954915967404e-06, "loss": 1.3638, "step": 21371 }, { "epoch": 0.58, "learning_rate": 7.794628858740057e-06, "loss": 1.3372, "step": 21372 }, { "epoch": 0.58, "learning_rate": 7.793766137993497e-06, "loss": 1.2109, "step": 21373 }, { "epoch": 0.58, "learning_rate": 7.792903434507474e-06, "loss": 1.3271, "step": 21374 }, { "epoch": 0.58, "learning_rate": 7.792040748288738e-06, "loss": 1.3469, "step": 21375 }, { "epoch": 0.58, "learning_rate": 7.791178079344037e-06, "loss": 1.2853, "step": 21376 }, { "epoch": 0.58, "learning_rate": 7.79031542768012e-06, "loss": 1.1776, "step": 21377 }, { "epoch": 0.58, "learning_rate": 7.789452793303736e-06, "loss": 1.1995, "step": 21378 }, { "epoch": 0.58, "learning_rate": 7.788590176221631e-06, "loss": 1.3394, "step": 21379 }, { "epoch": 0.58, "learning_rate": 7.787727576440561e-06, "loss": 1.2505, "step": 21380 }, { "epoch": 0.58, "learning_rate": 7.786864993967266e-06, "loss": 1.2795, "step": 21381 }, { "epoch": 0.58, "learning_rate": 7.786002428808504e-06, "loss": 1.2983, "step": 21382 }, { "epoch": 0.58, "learning_rate": 7.785139880971014e-06, "loss": 1.1306, "step": 21383 }, { "epoch": 0.58, "learning_rate": 7.784277350461549e-06, "loss": 1.3313, "step": 21384 }, { "epoch": 0.58, "learning_rate": 7.783414837286853e-06, "loss": 1.3032, "step": 21385 }, { "epoch": 0.58, "learning_rate": 7.782552341453683e-06, "loss": 1.3206, "step": 21386 }, { "epoch": 0.58, "learning_rate": 7.781689862968775e-06, "loss": 1.3752, "step": 21387 }, { "epoch": 0.58, "learning_rate": 7.780827401838884e-06, "loss": 1.2944, "step": 21388 }, { "epoch": 0.58, "learning_rate": 7.779964958070757e-06, "loss": 1.6753, "step": 21389 }, { "epoch": 0.58, "learning_rate": 7.77910253167114e-06, "loss": 1.2737, "step": 21390 }, { "epoch": 0.58, "learning_rate": 7.77824012264678e-06, "loss": 1.3047, "step": 21391 }, { "epoch": 0.58, "learning_rate": 7.777377731004426e-06, "loss": 1.438, "step": 21392 }, { "epoch": 0.58, "learning_rate": 7.776515356750823e-06, "loss": 1.4583, "step": 21393 }, { "epoch": 0.58, "learning_rate": 7.775652999892717e-06, "loss": 1.3264, "step": 21394 }, { "epoch": 0.58, "learning_rate": 7.774790660436857e-06, "loss": 1.3599, "step": 21395 }, { "epoch": 0.58, "learning_rate": 7.773928338389988e-06, "loss": 1.2866, "step": 21396 }, { "epoch": 0.58, "learning_rate": 7.773066033758858e-06, "loss": 1.2981, "step": 21397 }, { "epoch": 0.58, "learning_rate": 7.772203746550211e-06, "loss": 1.2034, "step": 21398 }, { "epoch": 0.58, "learning_rate": 7.771341476770795e-06, "loss": 1.3423, "step": 21399 }, { "epoch": 0.58, "learning_rate": 7.770479224427355e-06, "loss": 1.332, "step": 21400 }, { "epoch": 0.58, "learning_rate": 7.769616989526637e-06, "loss": 1.2673, "step": 21401 }, { "epoch": 0.58, "learning_rate": 7.768754772075387e-06, "loss": 1.2156, "step": 21402 }, { "epoch": 0.58, "learning_rate": 7.767892572080349e-06, "loss": 1.1443, "step": 21403 }, { "epoch": 0.58, "learning_rate": 7.767030389548273e-06, "loss": 1.2786, "step": 21404 }, { "epoch": 0.58, "learning_rate": 7.766168224485899e-06, "loss": 1.229, "step": 21405 }, { "epoch": 0.58, "learning_rate": 7.765306076899976e-06, "loss": 1.1968, "step": 21406 }, { "epoch": 0.58, "learning_rate": 7.764443946797244e-06, "loss": 1.1182, "step": 21407 }, { "epoch": 0.58, "learning_rate": 7.763581834184456e-06, "loss": 1.3811, "step": 21408 }, { "epoch": 0.58, "learning_rate": 7.762719739068349e-06, "loss": 1.2888, "step": 21409 }, { "epoch": 0.58, "learning_rate": 7.761857661455672e-06, "loss": 1.3452, "step": 21410 }, { "epoch": 0.58, "learning_rate": 7.760995601353167e-06, "loss": 1.4707, "step": 21411 }, { "epoch": 0.58, "learning_rate": 7.760133558767582e-06, "loss": 1.3237, "step": 21412 }, { "epoch": 0.58, "learning_rate": 7.759271533705656e-06, "loss": 1.0718, "step": 21413 }, { "epoch": 0.58, "learning_rate": 7.758409526174137e-06, "loss": 1.4163, "step": 21414 }, { "epoch": 0.58, "learning_rate": 7.757547536179769e-06, "loss": 1.2476, "step": 21415 }, { "epoch": 0.58, "learning_rate": 7.756685563729292e-06, "loss": 1.1208, "step": 21416 }, { "epoch": 0.58, "learning_rate": 7.755823608829453e-06, "loss": 1.3313, "step": 21417 }, { "epoch": 0.58, "learning_rate": 7.754961671486993e-06, "loss": 1.2876, "step": 21418 }, { "epoch": 0.58, "learning_rate": 7.754099751708662e-06, "loss": 1.2961, "step": 21419 }, { "epoch": 0.58, "learning_rate": 7.753237849501195e-06, "loss": 1.1858, "step": 21420 }, { "epoch": 0.58, "learning_rate": 7.752375964871341e-06, "loss": 1.2466, "step": 21421 }, { "epoch": 0.59, "learning_rate": 7.751514097825836e-06, "loss": 1.1672, "step": 21422 }, { "epoch": 0.59, "learning_rate": 7.750652248371435e-06, "loss": 1.3091, "step": 21423 }, { "epoch": 0.59, "learning_rate": 7.749790416514865e-06, "loss": 1.355, "step": 21424 }, { "epoch": 0.59, "learning_rate": 7.748928602262883e-06, "loss": 1.1606, "step": 21425 }, { "epoch": 0.59, "learning_rate": 7.74806680562222e-06, "loss": 1.4111, "step": 21426 }, { "epoch": 0.59, "learning_rate": 7.74720502659963e-06, "loss": 1.2314, "step": 21427 }, { "epoch": 0.59, "learning_rate": 7.74634326520184e-06, "loss": 1.2708, "step": 21428 }, { "epoch": 0.59, "learning_rate": 7.745481521435609e-06, "loss": 1.1697, "step": 21429 }, { "epoch": 0.59, "learning_rate": 7.744619795307661e-06, "loss": 1.1775, "step": 21430 }, { "epoch": 0.59, "learning_rate": 7.743758086824757e-06, "loss": 1.2539, "step": 21431 }, { "epoch": 0.59, "learning_rate": 7.742896395993621e-06, "loss": 1.397, "step": 21432 }, { "epoch": 0.59, "learning_rate": 7.742034722821005e-06, "loss": 1.2615, "step": 21433 }, { "epoch": 0.59, "learning_rate": 7.741173067313648e-06, "loss": 1.2844, "step": 21434 }, { "epoch": 0.59, "learning_rate": 7.74031142947829e-06, "loss": 1.1167, "step": 21435 }, { "epoch": 0.59, "learning_rate": 7.739449809321675e-06, "loss": 1.3354, "step": 21436 }, { "epoch": 0.59, "learning_rate": 7.73858820685054e-06, "loss": 1.0376, "step": 21437 }, { "epoch": 0.59, "learning_rate": 7.737726622071628e-06, "loss": 1.3062, "step": 21438 }, { "epoch": 0.59, "learning_rate": 7.736865054991677e-06, "loss": 1.1035, "step": 21439 }, { "epoch": 0.59, "learning_rate": 7.736003505617432e-06, "loss": 1.342, "step": 21440 }, { "epoch": 0.59, "learning_rate": 7.73514197395563e-06, "loss": 1.2351, "step": 21441 }, { "epoch": 0.59, "learning_rate": 7.734280460013014e-06, "loss": 1.1484, "step": 21442 }, { "epoch": 0.59, "learning_rate": 7.733418963796321e-06, "loss": 1.2087, "step": 21443 }, { "epoch": 0.59, "learning_rate": 7.732557485312293e-06, "loss": 1.1736, "step": 21444 }, { "epoch": 0.59, "learning_rate": 7.731696024567667e-06, "loss": 1.2583, "step": 21445 }, { "epoch": 0.59, "learning_rate": 7.730834581569186e-06, "loss": 1.3347, "step": 21446 }, { "epoch": 0.59, "learning_rate": 7.729973156323588e-06, "loss": 1.2393, "step": 21447 }, { "epoch": 0.59, "learning_rate": 7.729111748837614e-06, "loss": 1.25, "step": 21448 }, { "epoch": 0.59, "learning_rate": 7.728250359117999e-06, "loss": 1.4219, "step": 21449 }, { "epoch": 0.59, "learning_rate": 7.727388987171486e-06, "loss": 1.2715, "step": 21450 }, { "epoch": 0.59, "learning_rate": 7.726527633004815e-06, "loss": 1.8032, "step": 21451 }, { "epoch": 0.59, "learning_rate": 7.725666296624719e-06, "loss": 1.3513, "step": 21452 }, { "epoch": 0.59, "learning_rate": 7.724804978037943e-06, "loss": 1.3298, "step": 21453 }, { "epoch": 0.59, "learning_rate": 7.723943677251222e-06, "loss": 1.2454, "step": 21454 }, { "epoch": 0.59, "learning_rate": 7.723082394271295e-06, "loss": 1.3794, "step": 21455 }, { "epoch": 0.59, "learning_rate": 7.722221129104902e-06, "loss": 1.3076, "step": 21456 }, { "epoch": 0.59, "learning_rate": 7.72135988175878e-06, "loss": 1.3628, "step": 21457 }, { "epoch": 0.59, "learning_rate": 7.720498652239665e-06, "loss": 1.3264, "step": 21458 }, { "epoch": 0.59, "learning_rate": 7.7196374405543e-06, "loss": 1.1792, "step": 21459 }, { "epoch": 0.59, "learning_rate": 7.718776246709416e-06, "loss": 1.2905, "step": 21460 }, { "epoch": 0.59, "learning_rate": 7.717915070711756e-06, "loss": 1.2532, "step": 21461 }, { "epoch": 0.59, "learning_rate": 7.717053912568053e-06, "loss": 1.1042, "step": 21462 }, { "epoch": 0.59, "learning_rate": 7.71619277228505e-06, "loss": 1.4404, "step": 21463 }, { "epoch": 0.59, "learning_rate": 7.715331649869476e-06, "loss": 1.3452, "step": 21464 }, { "epoch": 0.59, "learning_rate": 7.714470545328073e-06, "loss": 1.303, "step": 21465 }, { "epoch": 0.59, "learning_rate": 7.713609458667583e-06, "loss": 1.2598, "step": 21466 }, { "epoch": 0.59, "learning_rate": 7.712748389894734e-06, "loss": 1.3616, "step": 21467 }, { "epoch": 0.59, "learning_rate": 7.711887339016268e-06, "loss": 1.1541, "step": 21468 }, { "epoch": 0.59, "learning_rate": 7.711026306038915e-06, "loss": 1.2646, "step": 21469 }, { "epoch": 0.59, "learning_rate": 7.710165290969423e-06, "loss": 1.3125, "step": 21470 }, { "epoch": 0.59, "learning_rate": 7.709304293814515e-06, "loss": 1.1462, "step": 21471 }, { "epoch": 0.59, "learning_rate": 7.708443314580938e-06, "loss": 1.3369, "step": 21472 }, { "epoch": 0.59, "learning_rate": 7.707582353275417e-06, "loss": 1.1812, "step": 21473 }, { "epoch": 0.59, "learning_rate": 7.706721409904701e-06, "loss": 1.4114, "step": 21474 }, { "epoch": 0.59, "learning_rate": 7.705860484475511e-06, "loss": 1.2041, "step": 21475 }, { "epoch": 0.59, "learning_rate": 7.704999576994595e-06, "loss": 1.3833, "step": 21476 }, { "epoch": 0.59, "learning_rate": 7.70413868746868e-06, "loss": 1.1899, "step": 21477 }, { "epoch": 0.59, "learning_rate": 7.703277815904508e-06, "loss": 1.2708, "step": 21478 }, { "epoch": 0.59, "learning_rate": 7.702416962308805e-06, "loss": 1.2278, "step": 21479 }, { "epoch": 0.59, "learning_rate": 7.701556126688313e-06, "loss": 1.2334, "step": 21480 }, { "epoch": 0.59, "learning_rate": 7.700695309049768e-06, "loss": 1.4446, "step": 21481 }, { "epoch": 0.59, "learning_rate": 7.699834509399899e-06, "loss": 1.4414, "step": 21482 }, { "epoch": 0.59, "learning_rate": 7.698973727745444e-06, "loss": 1.2446, "step": 21483 }, { "epoch": 0.59, "learning_rate": 7.698112964093136e-06, "loss": 1.3677, "step": 21484 }, { "epoch": 0.59, "learning_rate": 7.697252218449711e-06, "loss": 1.1946, "step": 21485 }, { "epoch": 0.59, "learning_rate": 7.696391490821901e-06, "loss": 1.3066, "step": 21486 }, { "epoch": 0.59, "learning_rate": 7.695530781216442e-06, "loss": 1.3611, "step": 21487 }, { "epoch": 0.59, "learning_rate": 7.694670089640064e-06, "loss": 1.1504, "step": 21488 }, { "epoch": 0.59, "learning_rate": 7.693809416099506e-06, "loss": 1.2222, "step": 21489 }, { "epoch": 0.59, "learning_rate": 7.692948760601497e-06, "loss": 1.3179, "step": 21490 }, { "epoch": 0.59, "learning_rate": 7.692088123152774e-06, "loss": 1.3535, "step": 21491 }, { "epoch": 0.59, "learning_rate": 7.691227503760064e-06, "loss": 1.5122, "step": 21492 }, { "epoch": 0.59, "learning_rate": 7.690366902430109e-06, "loss": 1.3308, "step": 21493 }, { "epoch": 0.59, "learning_rate": 7.689506319169634e-06, "loss": 1.113, "step": 21494 }, { "epoch": 0.59, "learning_rate": 7.688645753985376e-06, "loss": 1.3618, "step": 21495 }, { "epoch": 0.59, "learning_rate": 7.687785206884067e-06, "loss": 1.3696, "step": 21496 }, { "epoch": 0.59, "learning_rate": 7.68692467787244e-06, "loss": 1.7124, "step": 21497 }, { "epoch": 0.59, "learning_rate": 7.686064166957227e-06, "loss": 1.1919, "step": 21498 }, { "epoch": 0.59, "learning_rate": 7.685203674145158e-06, "loss": 1.4077, "step": 21499 }, { "epoch": 0.59, "learning_rate": 7.684343199442969e-06, "loss": 1.2876, "step": 21500 }, { "epoch": 0.59, "learning_rate": 7.683482742857386e-06, "loss": 1.2534, "step": 21501 }, { "epoch": 0.59, "learning_rate": 7.68262230439515e-06, "loss": 1.3813, "step": 21502 }, { "epoch": 0.59, "learning_rate": 7.681761884062983e-06, "loss": 1.2786, "step": 21503 }, { "epoch": 0.59, "learning_rate": 7.680901481867624e-06, "loss": 1.2288, "step": 21504 }, { "epoch": 0.59, "learning_rate": 7.6800410978158e-06, "loss": 1.3125, "step": 21505 }, { "epoch": 0.59, "learning_rate": 7.679180731914244e-06, "loss": 1.3113, "step": 21506 }, { "epoch": 0.59, "learning_rate": 7.678320384169684e-06, "loss": 1.2095, "step": 21507 }, { "epoch": 0.59, "learning_rate": 7.677460054588859e-06, "loss": 1.2336, "step": 21508 }, { "epoch": 0.59, "learning_rate": 7.67659974317849e-06, "loss": 1.3235, "step": 21509 }, { "epoch": 0.59, "learning_rate": 7.675739449945314e-06, "loss": 1.2896, "step": 21510 }, { "epoch": 0.59, "learning_rate": 7.674879174896057e-06, "loss": 1.0247, "step": 21511 }, { "epoch": 0.59, "learning_rate": 7.674018918037451e-06, "loss": 1.4097, "step": 21512 }, { "epoch": 0.59, "learning_rate": 7.673158679376233e-06, "loss": 1.1182, "step": 21513 }, { "epoch": 0.59, "learning_rate": 7.672298458919123e-06, "loss": 1.769, "step": 21514 }, { "epoch": 0.59, "learning_rate": 7.671438256672858e-06, "loss": 1.2964, "step": 21515 }, { "epoch": 0.59, "learning_rate": 7.670578072644162e-06, "loss": 1.687, "step": 21516 }, { "epoch": 0.59, "learning_rate": 7.669717906839774e-06, "loss": 1.3677, "step": 21517 }, { "epoch": 0.59, "learning_rate": 7.668857759266408e-06, "loss": 1.3115, "step": 21518 }, { "epoch": 0.59, "learning_rate": 7.667997629930812e-06, "loss": 1.2073, "step": 21519 }, { "epoch": 0.59, "learning_rate": 7.667137518839697e-06, "loss": 1.3354, "step": 21520 }, { "epoch": 0.59, "learning_rate": 7.66627742599981e-06, "loss": 1.1079, "step": 21521 }, { "epoch": 0.59, "learning_rate": 7.665417351417864e-06, "loss": 1.6582, "step": 21522 }, { "epoch": 0.59, "learning_rate": 7.6645572951006e-06, "loss": 1.1443, "step": 21523 }, { "epoch": 0.59, "learning_rate": 7.663697257054736e-06, "loss": 1.2021, "step": 21524 }, { "epoch": 0.59, "learning_rate": 7.662837237287014e-06, "loss": 1.2595, "step": 21525 }, { "epoch": 0.59, "learning_rate": 7.661977235804144e-06, "loss": 1.1445, "step": 21526 }, { "epoch": 0.59, "learning_rate": 7.66111725261287e-06, "loss": 1.2585, "step": 21527 }, { "epoch": 0.59, "learning_rate": 7.660257287719917e-06, "loss": 1.2627, "step": 21528 }, { "epoch": 0.59, "learning_rate": 7.659397341132006e-06, "loss": 1.3396, "step": 21529 }, { "epoch": 0.59, "learning_rate": 7.658537412855874e-06, "loss": 1.3845, "step": 21530 }, { "epoch": 0.59, "learning_rate": 7.657677502898241e-06, "loss": 1.3098, "step": 21531 }, { "epoch": 0.59, "learning_rate": 7.656817611265842e-06, "loss": 1.145, "step": 21532 }, { "epoch": 0.59, "learning_rate": 7.655957737965395e-06, "loss": 1.5098, "step": 21533 }, { "epoch": 0.59, "learning_rate": 7.655097883003637e-06, "loss": 1.3596, "step": 21534 }, { "epoch": 0.59, "learning_rate": 7.654238046387288e-06, "loss": 1.2188, "step": 21535 }, { "epoch": 0.59, "learning_rate": 7.653378228123078e-06, "loss": 1.2502, "step": 21536 }, { "epoch": 0.59, "learning_rate": 7.652518428217733e-06, "loss": 1.3472, "step": 21537 }, { "epoch": 0.59, "learning_rate": 7.651658646677981e-06, "loss": 1.3418, "step": 21538 }, { "epoch": 0.59, "learning_rate": 7.650798883510546e-06, "loss": 1.3081, "step": 21539 }, { "epoch": 0.59, "learning_rate": 7.649939138722158e-06, "loss": 1.1572, "step": 21540 }, { "epoch": 0.59, "learning_rate": 7.649079412319539e-06, "loss": 1.2476, "step": 21541 }, { "epoch": 0.59, "learning_rate": 7.648219704309416e-06, "loss": 1.2495, "step": 21542 }, { "epoch": 0.59, "learning_rate": 7.64736001469852e-06, "loss": 1.3506, "step": 21543 }, { "epoch": 0.59, "learning_rate": 7.64650034349357e-06, "loss": 1.2288, "step": 21544 }, { "epoch": 0.59, "learning_rate": 7.645640690701295e-06, "loss": 1.2715, "step": 21545 }, { "epoch": 0.59, "learning_rate": 7.644781056328421e-06, "loss": 1.2161, "step": 21546 }, { "epoch": 0.59, "learning_rate": 7.643921440381673e-06, "loss": 1.3994, "step": 21547 }, { "epoch": 0.59, "learning_rate": 7.643061842867774e-06, "loss": 1.4529, "step": 21548 }, { "epoch": 0.59, "learning_rate": 7.642202263793453e-06, "loss": 1.3374, "step": 21549 }, { "epoch": 0.59, "learning_rate": 7.64134270316543e-06, "loss": 1.3828, "step": 21550 }, { "epoch": 0.59, "learning_rate": 7.640483160990435e-06, "loss": 1.1455, "step": 21551 }, { "epoch": 0.59, "learning_rate": 7.639623637275189e-06, "loss": 1.3064, "step": 21552 }, { "epoch": 0.59, "learning_rate": 7.63876413202642e-06, "loss": 1.1785, "step": 21553 }, { "epoch": 0.59, "learning_rate": 7.637904645250847e-06, "loss": 1.3455, "step": 21554 }, { "epoch": 0.59, "learning_rate": 7.6370451769552e-06, "loss": 1.687, "step": 21555 }, { "epoch": 0.59, "learning_rate": 7.636185727146196e-06, "loss": 1.3667, "step": 21556 }, { "epoch": 0.59, "learning_rate": 7.635326295830566e-06, "loss": 1.4094, "step": 21557 }, { "epoch": 0.59, "learning_rate": 7.634466883015032e-06, "loss": 1.3394, "step": 21558 }, { "epoch": 0.59, "learning_rate": 7.633607488706315e-06, "loss": 1.2544, "step": 21559 }, { "epoch": 0.59, "learning_rate": 7.632748112911144e-06, "loss": 1.3027, "step": 21560 }, { "epoch": 0.59, "learning_rate": 7.631888755636232e-06, "loss": 1.1726, "step": 21561 }, { "epoch": 0.59, "learning_rate": 7.631029416888317e-06, "loss": 1.2808, "step": 21562 }, { "epoch": 0.59, "learning_rate": 7.630170096674106e-06, "loss": 1.1597, "step": 21563 }, { "epoch": 0.59, "learning_rate": 7.629310795000337e-06, "loss": 1.2302, "step": 21564 }, { "epoch": 0.59, "learning_rate": 7.6284515118737194e-06, "loss": 1.1448, "step": 21565 }, { "epoch": 0.59, "learning_rate": 7.627592247300988e-06, "loss": 1.3132, "step": 21566 }, { "epoch": 0.59, "learning_rate": 7.626733001288852e-06, "loss": 1.3623, "step": 21567 }, { "epoch": 0.59, "learning_rate": 7.625873773844048e-06, "loss": 1.1133, "step": 21568 }, { "epoch": 0.59, "learning_rate": 7.6250145649732855e-06, "loss": 1.2207, "step": 21569 }, { "epoch": 0.59, "learning_rate": 7.624155374683297e-06, "loss": 1.3076, "step": 21570 }, { "epoch": 0.59, "learning_rate": 7.623296202980795e-06, "loss": 1.2017, "step": 21571 }, { "epoch": 0.59, "learning_rate": 7.622437049872512e-06, "loss": 1.2927, "step": 21572 }, { "epoch": 0.59, "learning_rate": 7.621577915365157e-06, "loss": 1.3325, "step": 21573 }, { "epoch": 0.59, "learning_rate": 7.62071879946546e-06, "loss": 1.3173, "step": 21574 }, { "epoch": 0.59, "learning_rate": 7.619859702180141e-06, "loss": 1.3569, "step": 21575 }, { "epoch": 0.59, "learning_rate": 7.61900062351592e-06, "loss": 1.1821, "step": 21576 }, { "epoch": 0.59, "learning_rate": 7.618141563479521e-06, "loss": 1.2222, "step": 21577 }, { "epoch": 0.59, "learning_rate": 7.617282522077659e-06, "loss": 1.2742, "step": 21578 }, { "epoch": 0.59, "learning_rate": 7.616423499317061e-06, "loss": 1.3586, "step": 21579 }, { "epoch": 0.59, "learning_rate": 7.615564495204442e-06, "loss": 1.3298, "step": 21580 }, { "epoch": 0.59, "learning_rate": 7.614705509746527e-06, "loss": 1.2212, "step": 21581 }, { "epoch": 0.59, "learning_rate": 7.613846542950034e-06, "loss": 1.2668, "step": 21582 }, { "epoch": 0.59, "learning_rate": 7.612987594821685e-06, "loss": 1.3037, "step": 21583 }, { "epoch": 0.59, "learning_rate": 7.6121286653681955e-06, "loss": 1.313, "step": 21584 }, { "epoch": 0.59, "learning_rate": 7.611269754596291e-06, "loss": 1.2969, "step": 21585 }, { "epoch": 0.59, "learning_rate": 7.610410862512687e-06, "loss": 1.1592, "step": 21586 }, { "epoch": 0.59, "learning_rate": 7.609551989124107e-06, "loss": 1.325, "step": 21587 }, { "epoch": 0.59, "learning_rate": 7.608693134437265e-06, "loss": 1.2292, "step": 21588 }, { "epoch": 0.59, "learning_rate": 7.607834298458885e-06, "loss": 1.2051, "step": 21589 }, { "epoch": 0.59, "learning_rate": 7.6069754811956854e-06, "loss": 1.1721, "step": 21590 }, { "epoch": 0.59, "learning_rate": 7.606116682654383e-06, "loss": 1.3418, "step": 21591 }, { "epoch": 0.59, "learning_rate": 7.6052579028417e-06, "loss": 1.3486, "step": 21592 }, { "epoch": 0.59, "learning_rate": 7.60439914176435e-06, "loss": 1.2446, "step": 21593 }, { "epoch": 0.59, "learning_rate": 7.603540399429058e-06, "loss": 1.4055, "step": 21594 }, { "epoch": 0.59, "learning_rate": 7.602681675842536e-06, "loss": 1.2588, "step": 21595 }, { "epoch": 0.59, "learning_rate": 7.601822971011508e-06, "loss": 1.3701, "step": 21596 }, { "epoch": 0.59, "learning_rate": 7.600964284942687e-06, "loss": 1.0613, "step": 21597 }, { "epoch": 0.59, "learning_rate": 7.600105617642795e-06, "loss": 1.2542, "step": 21598 }, { "epoch": 0.59, "learning_rate": 7.599246969118547e-06, "loss": 1.2202, "step": 21599 }, { "epoch": 0.59, "learning_rate": 7.598388339376663e-06, "loss": 1.1567, "step": 21600 }, { "epoch": 0.59, "learning_rate": 7.597529728423858e-06, "loss": 1.2107, "step": 21601 }, { "epoch": 0.59, "learning_rate": 7.596671136266852e-06, "loss": 1.168, "step": 21602 }, { "epoch": 0.59, "learning_rate": 7.595812562912359e-06, "loss": 1.4377, "step": 21603 }, { "epoch": 0.59, "learning_rate": 7.594954008367097e-06, "loss": 1.2085, "step": 21604 }, { "epoch": 0.59, "learning_rate": 7.594095472637789e-06, "loss": 1.3884, "step": 21605 }, { "epoch": 0.59, "learning_rate": 7.59323695573114e-06, "loss": 1.355, "step": 21606 }, { "epoch": 0.59, "learning_rate": 7.592378457653882e-06, "loss": 1.2017, "step": 21607 }, { "epoch": 0.59, "learning_rate": 7.591519978412714e-06, "loss": 1.2178, "step": 21608 }, { "epoch": 0.59, "learning_rate": 7.590661518014369e-06, "loss": 1.2485, "step": 21609 }, { "epoch": 0.59, "learning_rate": 7.589803076465547e-06, "loss": 1.2007, "step": 21610 }, { "epoch": 0.59, "learning_rate": 7.588944653772981e-06, "loss": 1.3838, "step": 21611 }, { "epoch": 0.59, "learning_rate": 7.588086249943371e-06, "loss": 1.1497, "step": 21612 }, { "epoch": 0.59, "learning_rate": 7.587227864983446e-06, "loss": 1.3, "step": 21613 }, { "epoch": 0.59, "learning_rate": 7.586369498899909e-06, "loss": 1.1709, "step": 21614 }, { "epoch": 0.59, "learning_rate": 7.585511151699487e-06, "loss": 1.3809, "step": 21615 }, { "epoch": 0.59, "learning_rate": 7.584652823388888e-06, "loss": 1.2395, "step": 21616 }, { "epoch": 0.59, "learning_rate": 7.583794513974832e-06, "loss": 1.1277, "step": 21617 }, { "epoch": 0.59, "learning_rate": 7.582936223464029e-06, "loss": 1.2451, "step": 21618 }, { "epoch": 0.59, "learning_rate": 7.582077951863197e-06, "loss": 1.3389, "step": 21619 }, { "epoch": 0.59, "learning_rate": 7.581219699179052e-06, "loss": 1.2905, "step": 21620 }, { "epoch": 0.59, "learning_rate": 7.5803614654183044e-06, "loss": 1.2534, "step": 21621 }, { "epoch": 0.59, "learning_rate": 7.579503250587672e-06, "loss": 1.2651, "step": 21622 }, { "epoch": 0.59, "learning_rate": 7.578645054693867e-06, "loss": 1.3135, "step": 21623 }, { "epoch": 0.59, "learning_rate": 7.577786877743607e-06, "loss": 1.3013, "step": 21624 }, { "epoch": 0.59, "learning_rate": 7.5769287197436e-06, "loss": 1.2764, "step": 21625 }, { "epoch": 0.59, "learning_rate": 7.576070580700567e-06, "loss": 1.3091, "step": 21626 }, { "epoch": 0.59, "learning_rate": 7.5752124606212155e-06, "loss": 1.2581, "step": 21627 }, { "epoch": 0.59, "learning_rate": 7.574354359512263e-06, "loss": 1.3838, "step": 21628 }, { "epoch": 0.59, "learning_rate": 7.573496277380419e-06, "loss": 1.3479, "step": 21629 }, { "epoch": 0.59, "learning_rate": 7.572638214232401e-06, "loss": 1.3159, "step": 21630 }, { "epoch": 0.59, "learning_rate": 7.571780170074919e-06, "loss": 1.2515, "step": 21631 }, { "epoch": 0.59, "learning_rate": 7.570922144914689e-06, "loss": 1.3311, "step": 21632 }, { "epoch": 0.59, "learning_rate": 7.5700641387584205e-06, "loss": 1.2349, "step": 21633 }, { "epoch": 0.59, "learning_rate": 7.569206151612829e-06, "loss": 1.2478, "step": 21634 }, { "epoch": 0.59, "learning_rate": 7.568348183484623e-06, "loss": 1.1929, "step": 21635 }, { "epoch": 0.59, "learning_rate": 7.567490234380518e-06, "loss": 1.1787, "step": 21636 }, { "epoch": 0.59, "learning_rate": 7.5666323043072265e-06, "loss": 1.3625, "step": 21637 }, { "epoch": 0.59, "learning_rate": 7.565774393271459e-06, "loss": 1.2498, "step": 21638 }, { "epoch": 0.59, "learning_rate": 7.56491650127993e-06, "loss": 1.2446, "step": 21639 }, { "epoch": 0.59, "learning_rate": 7.5640586283393455e-06, "loss": 1.2219, "step": 21640 }, { "epoch": 0.59, "learning_rate": 7.563200774456425e-06, "loss": 1.3323, "step": 21641 }, { "epoch": 0.59, "learning_rate": 7.562342939637872e-06, "loss": 1.2117, "step": 21642 }, { "epoch": 0.59, "learning_rate": 7.561485123890404e-06, "loss": 1.2629, "step": 21643 }, { "epoch": 0.59, "learning_rate": 7.560627327220729e-06, "loss": 1.2058, "step": 21644 }, { "epoch": 0.59, "learning_rate": 7.55976954963556e-06, "loss": 1.427, "step": 21645 }, { "epoch": 0.59, "learning_rate": 7.5589117911416034e-06, "loss": 1.3313, "step": 21646 }, { "epoch": 0.59, "learning_rate": 7.558054051745576e-06, "loss": 1.3232, "step": 21647 }, { "epoch": 0.59, "learning_rate": 7.557196331454182e-06, "loss": 1.2935, "step": 21648 }, { "epoch": 0.59, "learning_rate": 7.55633863027414e-06, "loss": 1.2192, "step": 21649 }, { "epoch": 0.59, "learning_rate": 7.55548094821215e-06, "loss": 1.374, "step": 21650 }, { "epoch": 0.59, "learning_rate": 7.55462328527493e-06, "loss": 1.4153, "step": 21651 }, { "epoch": 0.59, "learning_rate": 7.55376564146919e-06, "loss": 1.2583, "step": 21652 }, { "epoch": 0.59, "learning_rate": 7.552908016801633e-06, "loss": 1.4028, "step": 21653 }, { "epoch": 0.59, "learning_rate": 7.552050411278977e-06, "loss": 1.241, "step": 21654 }, { "epoch": 0.59, "learning_rate": 7.5511928249079245e-06, "loss": 1.2374, "step": 21655 }, { "epoch": 0.59, "learning_rate": 7.550335257695192e-06, "loss": 1.2473, "step": 21656 }, { "epoch": 0.59, "learning_rate": 7.549477709647479e-06, "loss": 1.3306, "step": 21657 }, { "epoch": 0.59, "learning_rate": 7.548620180771505e-06, "loss": 1.2483, "step": 21658 }, { "epoch": 0.59, "learning_rate": 7.54776267107397e-06, "loss": 1.3291, "step": 21659 }, { "epoch": 0.59, "learning_rate": 7.54690518056159e-06, "loss": 1.2546, "step": 21660 }, { "epoch": 0.59, "learning_rate": 7.546047709241068e-06, "loss": 1.2852, "step": 21661 }, { "epoch": 0.59, "learning_rate": 7.545190257119117e-06, "loss": 1.1458, "step": 21662 }, { "epoch": 0.59, "learning_rate": 7.5443328242024404e-06, "loss": 1.2576, "step": 21663 }, { "epoch": 0.59, "learning_rate": 7.5434754104977515e-06, "loss": 1.3025, "step": 21664 }, { "epoch": 0.59, "learning_rate": 7.542618016011753e-06, "loss": 1.3247, "step": 21665 }, { "epoch": 0.59, "learning_rate": 7.541760640751158e-06, "loss": 1.3958, "step": 21666 }, { "epoch": 0.59, "learning_rate": 7.540903284722671e-06, "loss": 1.2471, "step": 21667 }, { "epoch": 0.59, "learning_rate": 7.540045947933e-06, "loss": 1.2427, "step": 21668 }, { "epoch": 0.59, "learning_rate": 7.539188630388855e-06, "loss": 1.3032, "step": 21669 }, { "epoch": 0.59, "learning_rate": 7.538331332096938e-06, "loss": 1.2681, "step": 21670 }, { "epoch": 0.59, "learning_rate": 7.537474053063961e-06, "loss": 1.3477, "step": 21671 }, { "epoch": 0.59, "learning_rate": 7.536616793296629e-06, "loss": 1.2522, "step": 21672 }, { "epoch": 0.59, "learning_rate": 7.535759552801648e-06, "loss": 1.1404, "step": 21673 }, { "epoch": 0.59, "learning_rate": 7.534902331585725e-06, "loss": 1.3474, "step": 21674 }, { "epoch": 0.59, "learning_rate": 7.5340451296555695e-06, "loss": 1.2739, "step": 21675 }, { "epoch": 0.59, "learning_rate": 7.533187947017882e-06, "loss": 1.209, "step": 21676 }, { "epoch": 0.59, "learning_rate": 7.532330783679375e-06, "loss": 1.3728, "step": 21677 }, { "epoch": 0.59, "learning_rate": 7.531473639646749e-06, "loss": 1.4287, "step": 21678 }, { "epoch": 0.59, "learning_rate": 7.530616514926715e-06, "loss": 1.3215, "step": 21679 }, { "epoch": 0.59, "learning_rate": 7.529759409525974e-06, "loss": 1.2227, "step": 21680 }, { "epoch": 0.59, "learning_rate": 7.5289023234512315e-06, "loss": 1.2275, "step": 21681 }, { "epoch": 0.59, "learning_rate": 7.528045256709201e-06, "loss": 1.3062, "step": 21682 }, { "epoch": 0.59, "learning_rate": 7.527188209306576e-06, "loss": 1.1567, "step": 21683 }, { "epoch": 0.59, "learning_rate": 7.526331181250075e-06, "loss": 1.2644, "step": 21684 }, { "epoch": 0.59, "learning_rate": 7.525474172546389e-06, "loss": 1.2476, "step": 21685 }, { "epoch": 0.59, "learning_rate": 7.524617183202235e-06, "loss": 1.238, "step": 21686 }, { "epoch": 0.59, "learning_rate": 7.523760213224306e-06, "loss": 1.2083, "step": 21687 }, { "epoch": 0.59, "learning_rate": 7.522903262619319e-06, "loss": 1.3818, "step": 21688 }, { "epoch": 0.59, "learning_rate": 7.522046331393967e-06, "loss": 1.2683, "step": 21689 }, { "epoch": 0.59, "learning_rate": 7.521189419554964e-06, "loss": 1.3704, "step": 21690 }, { "epoch": 0.59, "learning_rate": 7.5203325271090036e-06, "loss": 1.2446, "step": 21691 }, { "epoch": 0.59, "learning_rate": 7.519475654062802e-06, "loss": 1.417, "step": 21692 }, { "epoch": 0.59, "learning_rate": 7.51861880042305e-06, "loss": 1.1848, "step": 21693 }, { "epoch": 0.59, "learning_rate": 7.517761966196464e-06, "loss": 1.26, "step": 21694 }, { "epoch": 0.59, "learning_rate": 7.516905151389734e-06, "loss": 1.1379, "step": 21695 }, { "epoch": 0.59, "learning_rate": 7.516048356009578e-06, "loss": 1.292, "step": 21696 }, { "epoch": 0.59, "learning_rate": 7.515191580062684e-06, "loss": 1.218, "step": 21697 }, { "epoch": 0.59, "learning_rate": 7.514334823555767e-06, "loss": 1.2744, "step": 21698 }, { "epoch": 0.59, "learning_rate": 7.513478086495525e-06, "loss": 1.3621, "step": 21699 }, { "epoch": 0.59, "learning_rate": 7.512621368888661e-06, "loss": 1.2893, "step": 21700 }, { "epoch": 0.59, "learning_rate": 7.511764670741879e-06, "loss": 1.2454, "step": 21701 }, { "epoch": 0.59, "learning_rate": 7.510907992061878e-06, "loss": 1.2241, "step": 21702 }, { "epoch": 0.59, "learning_rate": 7.510051332855365e-06, "loss": 1.3682, "step": 21703 }, { "epoch": 0.59, "learning_rate": 7.509194693129037e-06, "loss": 1.1782, "step": 21704 }, { "epoch": 0.59, "learning_rate": 7.5083380728896e-06, "loss": 1.3259, "step": 21705 }, { "epoch": 0.59, "learning_rate": 7.507481472143754e-06, "loss": 1.3599, "step": 21706 }, { "epoch": 0.59, "learning_rate": 7.506624890898202e-06, "loss": 1.1946, "step": 21707 }, { "epoch": 0.59, "learning_rate": 7.505768329159642e-06, "loss": 1.2498, "step": 21708 }, { "epoch": 0.59, "learning_rate": 7.50491178693478e-06, "loss": 1.3936, "step": 21709 }, { "epoch": 0.59, "learning_rate": 7.504055264230312e-06, "loss": 1.2886, "step": 21710 }, { "epoch": 0.59, "learning_rate": 7.503198761052945e-06, "loss": 1.3237, "step": 21711 }, { "epoch": 0.59, "learning_rate": 7.5023422774093745e-06, "loss": 1.179, "step": 21712 }, { "epoch": 0.59, "learning_rate": 7.501485813306304e-06, "loss": 1.0786, "step": 21713 }, { "epoch": 0.59, "learning_rate": 7.500629368750435e-06, "loss": 1.385, "step": 21714 }, { "epoch": 0.59, "learning_rate": 7.499772943748465e-06, "loss": 1.3979, "step": 21715 }, { "epoch": 0.59, "learning_rate": 7.498916538307097e-06, "loss": 1.2874, "step": 21716 }, { "epoch": 0.59, "learning_rate": 7.498060152433028e-06, "loss": 1.2009, "step": 21717 }, { "epoch": 0.59, "learning_rate": 7.497203786132963e-06, "loss": 1.2708, "step": 21718 }, { "epoch": 0.59, "learning_rate": 7.496347439413596e-06, "loss": 1.353, "step": 21719 }, { "epoch": 0.59, "learning_rate": 7.495491112281632e-06, "loss": 1.2271, "step": 21720 }, { "epoch": 0.59, "learning_rate": 7.494634804743766e-06, "loss": 1.1328, "step": 21721 }, { "epoch": 0.59, "learning_rate": 7.4937785168067e-06, "loss": 1.3149, "step": 21722 }, { "epoch": 0.59, "learning_rate": 7.49292224847713e-06, "loss": 1.7964, "step": 21723 }, { "epoch": 0.59, "learning_rate": 7.49206599976176e-06, "loss": 1.1802, "step": 21724 }, { "epoch": 0.59, "learning_rate": 7.491209770667285e-06, "loss": 1.2546, "step": 21725 }, { "epoch": 0.59, "learning_rate": 7.490353561200406e-06, "loss": 1.0999, "step": 21726 }, { "epoch": 0.59, "learning_rate": 7.48949737136782e-06, "loss": 1.2656, "step": 21727 }, { "epoch": 0.59, "learning_rate": 7.488641201176223e-06, "loss": 1.3635, "step": 21728 }, { "epoch": 0.59, "learning_rate": 7.487785050632322e-06, "loss": 1.3394, "step": 21729 }, { "epoch": 0.59, "learning_rate": 7.4869289197428045e-06, "loss": 1.209, "step": 21730 }, { "epoch": 0.59, "learning_rate": 7.486072808514378e-06, "loss": 1.3445, "step": 21731 }, { "epoch": 0.59, "learning_rate": 7.485216716953731e-06, "loss": 1.3494, "step": 21732 }, { "epoch": 0.59, "learning_rate": 7.484360645067572e-06, "loss": 1.2053, "step": 21733 }, { "epoch": 0.59, "learning_rate": 7.483504592862585e-06, "loss": 0.9946, "step": 21734 }, { "epoch": 0.59, "learning_rate": 7.482648560345482e-06, "loss": 1.2771, "step": 21735 }, { "epoch": 0.59, "learning_rate": 7.481792547522946e-06, "loss": 1.0972, "step": 21736 }, { "epoch": 0.59, "learning_rate": 7.480936554401688e-06, "loss": 1.2915, "step": 21737 }, { "epoch": 0.59, "learning_rate": 7.480080580988392e-06, "loss": 1.4795, "step": 21738 }, { "epoch": 0.59, "learning_rate": 7.479224627289765e-06, "loss": 1.3159, "step": 21739 }, { "epoch": 0.59, "learning_rate": 7.478368693312494e-06, "loss": 1.1702, "step": 21740 }, { "epoch": 0.59, "learning_rate": 7.477512779063288e-06, "loss": 1.4592, "step": 21741 }, { "epoch": 0.59, "learning_rate": 7.476656884548827e-06, "loss": 1.4114, "step": 21742 }, { "epoch": 0.59, "learning_rate": 7.47580100977582e-06, "loss": 1.0928, "step": 21743 }, { "epoch": 0.59, "learning_rate": 7.47494515475096e-06, "loss": 1.0702, "step": 21744 }, { "epoch": 0.59, "learning_rate": 7.4740893194809394e-06, "loss": 1.2346, "step": 21745 }, { "epoch": 0.59, "learning_rate": 7.473233503972459e-06, "loss": 1.4194, "step": 21746 }, { "epoch": 0.59, "learning_rate": 7.4723777082322105e-06, "loss": 1.2656, "step": 21747 }, { "epoch": 0.59, "learning_rate": 7.471521932266891e-06, "loss": 1.2617, "step": 21748 }, { "epoch": 0.59, "learning_rate": 7.470666176083193e-06, "loss": 1.418, "step": 21749 }, { "epoch": 0.59, "learning_rate": 7.469810439687815e-06, "loss": 1.2402, "step": 21750 }, { "epoch": 0.59, "learning_rate": 7.4689547230874495e-06, "loss": 1.2119, "step": 21751 }, { "epoch": 0.59, "learning_rate": 7.4680990262887935e-06, "loss": 1.3608, "step": 21752 }, { "epoch": 0.59, "learning_rate": 7.467243349298538e-06, "loss": 1.2083, "step": 21753 }, { "epoch": 0.59, "learning_rate": 7.466387692123381e-06, "loss": 1.3743, "step": 21754 }, { "epoch": 0.59, "learning_rate": 7.465532054770015e-06, "loss": 1.385, "step": 21755 }, { "epoch": 0.59, "learning_rate": 7.464676437245135e-06, "loss": 1.2764, "step": 21756 }, { "epoch": 0.59, "learning_rate": 7.463820839555432e-06, "loss": 1.4133, "step": 21757 }, { "epoch": 0.59, "learning_rate": 7.462965261707605e-06, "loss": 1.3291, "step": 21758 }, { "epoch": 0.59, "learning_rate": 7.4621097037083426e-06, "loss": 1.3303, "step": 21759 }, { "epoch": 0.59, "learning_rate": 7.461254165564341e-06, "loss": 1.251, "step": 21760 }, { "epoch": 0.59, "learning_rate": 7.4603986472822945e-06, "loss": 1.4126, "step": 21761 }, { "epoch": 0.59, "learning_rate": 7.459543148868893e-06, "loss": 1.3167, "step": 21762 }, { "epoch": 0.59, "learning_rate": 7.458687670330833e-06, "loss": 1.3005, "step": 21763 }, { "epoch": 0.59, "learning_rate": 7.457832211674803e-06, "loss": 1.356, "step": 21764 }, { "epoch": 0.59, "learning_rate": 7.4569767729075026e-06, "loss": 1.322, "step": 21765 }, { "epoch": 0.59, "learning_rate": 7.456121354035616e-06, "loss": 1.3962, "step": 21766 }, { "epoch": 0.59, "learning_rate": 7.455265955065842e-06, "loss": 1.2285, "step": 21767 }, { "epoch": 0.59, "learning_rate": 7.454410576004869e-06, "loss": 1.2925, "step": 21768 }, { "epoch": 0.59, "learning_rate": 7.453555216859394e-06, "loss": 1.2789, "step": 21769 }, { "epoch": 0.59, "learning_rate": 7.452699877636101e-06, "loss": 1.4004, "step": 21770 }, { "epoch": 0.59, "learning_rate": 7.45184455834169e-06, "loss": 1.2483, "step": 21771 }, { "epoch": 0.59, "learning_rate": 7.4509892589828455e-06, "loss": 1.1511, "step": 21772 }, { "epoch": 0.59, "learning_rate": 7.450133979566265e-06, "loss": 1.1472, "step": 21773 }, { "epoch": 0.59, "learning_rate": 7.449278720098636e-06, "loss": 1.3757, "step": 21774 }, { "epoch": 0.59, "learning_rate": 7.448423480586648e-06, "loss": 1.2861, "step": 21775 }, { "epoch": 0.59, "learning_rate": 7.447568261037001e-06, "loss": 1.2693, "step": 21776 }, { "epoch": 0.59, "learning_rate": 7.446713061456375e-06, "loss": 1.2739, "step": 21777 }, { "epoch": 0.59, "learning_rate": 7.445857881851471e-06, "loss": 1.4141, "step": 21778 }, { "epoch": 0.59, "learning_rate": 7.445002722228967e-06, "loss": 1.1528, "step": 21779 }, { "epoch": 0.59, "learning_rate": 7.444147582595567e-06, "loss": 1.3877, "step": 21780 }, { "epoch": 0.59, "learning_rate": 7.443292462957947e-06, "loss": 1.0714, "step": 21781 }, { "epoch": 0.59, "learning_rate": 7.442437363322812e-06, "loss": 1.1938, "step": 21782 }, { "epoch": 0.59, "learning_rate": 7.441582283696837e-06, "loss": 1.3911, "step": 21783 }, { "epoch": 0.59, "learning_rate": 7.440727224086725e-06, "loss": 1.2993, "step": 21784 }, { "epoch": 0.59, "learning_rate": 7.439872184499155e-06, "loss": 1.2661, "step": 21785 }, { "epoch": 0.59, "learning_rate": 7.439017164940827e-06, "loss": 1.3276, "step": 21786 }, { "epoch": 0.59, "learning_rate": 7.438162165418419e-06, "loss": 1.2761, "step": 21787 }, { "epoch": 0.6, "learning_rate": 7.437307185938631e-06, "loss": 1.2886, "step": 21788 }, { "epoch": 0.6, "learning_rate": 7.436452226508141e-06, "loss": 1.2039, "step": 21789 }, { "epoch": 0.6, "learning_rate": 7.4355972871336445e-06, "loss": 1.3062, "step": 21790 }, { "epoch": 0.6, "learning_rate": 7.434742367821831e-06, "loss": 1.3298, "step": 21791 }, { "epoch": 0.6, "learning_rate": 7.433887468579385e-06, "loss": 1.4097, "step": 21792 }, { "epoch": 0.6, "learning_rate": 7.433032589412998e-06, "loss": 1.3262, "step": 21793 }, { "epoch": 0.6, "learning_rate": 7.432177730329358e-06, "loss": 1.2896, "step": 21794 }, { "epoch": 0.6, "learning_rate": 7.431322891335151e-06, "loss": 1.0679, "step": 21795 }, { "epoch": 0.6, "learning_rate": 7.430468072437064e-06, "loss": 1.269, "step": 21796 }, { "epoch": 0.6, "learning_rate": 7.429613273641789e-06, "loss": 1.2415, "step": 21797 }, { "epoch": 0.6, "learning_rate": 7.42875849495601e-06, "loss": 1.3723, "step": 21798 }, { "epoch": 0.6, "learning_rate": 7.427903736386417e-06, "loss": 1.2026, "step": 21799 }, { "epoch": 0.6, "learning_rate": 7.427048997939693e-06, "loss": 1.2678, "step": 21800 }, { "epoch": 0.6, "learning_rate": 7.42619427962253e-06, "loss": 1.7422, "step": 21801 }, { "epoch": 0.6, "learning_rate": 7.425339581441611e-06, "loss": 1.3318, "step": 21802 }, { "epoch": 0.6, "learning_rate": 7.424484903403626e-06, "loss": 1.2117, "step": 21803 }, { "epoch": 0.6, "learning_rate": 7.4236302455152585e-06, "loss": 1.3184, "step": 21804 }, { "epoch": 0.6, "learning_rate": 7.422775607783197e-06, "loss": 1.2883, "step": 21805 }, { "epoch": 0.6, "learning_rate": 7.4219209902141275e-06, "loss": 1.2358, "step": 21806 }, { "epoch": 0.6, "learning_rate": 7.421066392814736e-06, "loss": 1.1394, "step": 21807 }, { "epoch": 0.6, "learning_rate": 7.420211815591709e-06, "loss": 1.1997, "step": 21808 }, { "epoch": 0.6, "learning_rate": 7.4193572585517295e-06, "loss": 1.397, "step": 21809 }, { "epoch": 0.6, "learning_rate": 7.4185027217014875e-06, "loss": 1.2671, "step": 21810 }, { "epoch": 0.6, "learning_rate": 7.417648205047665e-06, "loss": 1.2112, "step": 21811 }, { "epoch": 0.6, "learning_rate": 7.41679370859695e-06, "loss": 1.6816, "step": 21812 }, { "epoch": 0.6, "learning_rate": 7.4159392323560245e-06, "loss": 1.2539, "step": 21813 }, { "epoch": 0.6, "learning_rate": 7.4150847763315755e-06, "loss": 1.1675, "step": 21814 }, { "epoch": 0.6, "learning_rate": 7.414230340530289e-06, "loss": 1.3984, "step": 21815 }, { "epoch": 0.6, "learning_rate": 7.413375924958848e-06, "loss": 1.2217, "step": 21816 }, { "epoch": 0.6, "learning_rate": 7.412521529623937e-06, "loss": 1.2637, "step": 21817 }, { "epoch": 0.6, "learning_rate": 7.411667154532241e-06, "loss": 1.1396, "step": 21818 }, { "epoch": 0.6, "learning_rate": 7.4108127996904434e-06, "loss": 1.2344, "step": 21819 }, { "epoch": 0.6, "learning_rate": 7.409958465105232e-06, "loss": 1.377, "step": 21820 }, { "epoch": 0.6, "learning_rate": 7.409104150783284e-06, "loss": 1.3826, "step": 21821 }, { "epoch": 0.6, "learning_rate": 7.408249856731284e-06, "loss": 1.2712, "step": 21822 }, { "epoch": 0.6, "learning_rate": 7.4073955829559265e-06, "loss": 1.2007, "step": 21823 }, { "epoch": 0.6, "learning_rate": 7.406541329463879e-06, "loss": 1.1965, "step": 21824 }, { "epoch": 0.6, "learning_rate": 7.40568709626184e-06, "loss": 1.1724, "step": 21825 }, { "epoch": 0.6, "learning_rate": 7.404832883356479e-06, "loss": 1.2107, "step": 21826 }, { "epoch": 0.6, "learning_rate": 7.4039786907544905e-06, "loss": 1.2346, "step": 21827 }, { "epoch": 0.6, "learning_rate": 7.403124518462547e-06, "loss": 1.3364, "step": 21828 }, { "epoch": 0.6, "learning_rate": 7.402270366487341e-06, "loss": 1.2091, "step": 21829 }, { "epoch": 0.6, "learning_rate": 7.401416234835545e-06, "loss": 1.1289, "step": 21830 }, { "epoch": 0.6, "learning_rate": 7.400562123513852e-06, "loss": 1.312, "step": 21831 }, { "epoch": 0.6, "learning_rate": 7.399708032528933e-06, "loss": 1.343, "step": 21832 }, { "epoch": 0.6, "learning_rate": 7.398853961887481e-06, "loss": 1.7158, "step": 21833 }, { "epoch": 0.6, "learning_rate": 7.397999911596167e-06, "loss": 1.7397, "step": 21834 }, { "epoch": 0.6, "learning_rate": 7.397145881661683e-06, "loss": 1.3201, "step": 21835 }, { "epoch": 0.6, "learning_rate": 7.396291872090702e-06, "loss": 1.4731, "step": 21836 }, { "epoch": 0.6, "learning_rate": 7.3954378828899084e-06, "loss": 1.3237, "step": 21837 }, { "epoch": 0.6, "learning_rate": 7.394583914065987e-06, "loss": 1.4209, "step": 21838 }, { "epoch": 0.6, "learning_rate": 7.3937299656256145e-06, "loss": 1.2815, "step": 21839 }, { "epoch": 0.6, "learning_rate": 7.392876037575475e-06, "loss": 1.2532, "step": 21840 }, { "epoch": 0.6, "learning_rate": 7.392022129922245e-06, "loss": 1.293, "step": 21841 }, { "epoch": 0.6, "learning_rate": 7.3911682426726105e-06, "loss": 1.2437, "step": 21842 }, { "epoch": 0.6, "learning_rate": 7.390314375833245e-06, "loss": 1.2937, "step": 21843 }, { "epoch": 0.6, "learning_rate": 7.389460529410837e-06, "loss": 1.2266, "step": 21844 }, { "epoch": 0.6, "learning_rate": 7.388606703412059e-06, "loss": 1.3044, "step": 21845 }, { "epoch": 0.6, "learning_rate": 7.387752897843596e-06, "loss": 1.3975, "step": 21846 }, { "epoch": 0.6, "learning_rate": 7.386899112712125e-06, "loss": 1.269, "step": 21847 }, { "epoch": 0.6, "learning_rate": 7.386045348024327e-06, "loss": 1.2148, "step": 21848 }, { "epoch": 0.6, "learning_rate": 7.385191603786881e-06, "loss": 1.3518, "step": 21849 }, { "epoch": 0.6, "learning_rate": 7.384337880006467e-06, "loss": 1.2839, "step": 21850 }, { "epoch": 0.6, "learning_rate": 7.383484176689762e-06, "loss": 1.2192, "step": 21851 }, { "epoch": 0.6, "learning_rate": 7.3826304938434456e-06, "loss": 1.3484, "step": 21852 }, { "epoch": 0.6, "learning_rate": 7.381776831474199e-06, "loss": 1.3115, "step": 21853 }, { "epoch": 0.6, "learning_rate": 7.380923189588698e-06, "loss": 1.3452, "step": 21854 }, { "epoch": 0.6, "learning_rate": 7.380069568193625e-06, "loss": 1.1538, "step": 21855 }, { "epoch": 0.6, "learning_rate": 7.379215967295654e-06, "loss": 1.3052, "step": 21856 }, { "epoch": 0.6, "learning_rate": 7.378362386901465e-06, "loss": 1.3811, "step": 21857 }, { "epoch": 0.6, "learning_rate": 7.377508827017736e-06, "loss": 1.343, "step": 21858 }, { "epoch": 0.6, "learning_rate": 7.3766552876511466e-06, "loss": 1.3481, "step": 21859 }, { "epoch": 0.6, "learning_rate": 7.3758017688083695e-06, "loss": 1.1289, "step": 21860 }, { "epoch": 0.6, "learning_rate": 7.374948270496087e-06, "loss": 1.3225, "step": 21861 }, { "epoch": 0.6, "learning_rate": 7.374094792720974e-06, "loss": 1.2844, "step": 21862 }, { "epoch": 0.6, "learning_rate": 7.37324133548971e-06, "loss": 1.4355, "step": 21863 }, { "epoch": 0.6, "learning_rate": 7.372387898808969e-06, "loss": 1.3359, "step": 21864 }, { "epoch": 0.6, "learning_rate": 7.371534482685432e-06, "loss": 0.8721, "step": 21865 }, { "epoch": 0.6, "learning_rate": 7.370681087125771e-06, "loss": 1.355, "step": 21866 }, { "epoch": 0.6, "learning_rate": 7.369827712136661e-06, "loss": 1.3105, "step": 21867 }, { "epoch": 0.6, "learning_rate": 7.368974357724789e-06, "loss": 1.373, "step": 21868 }, { "epoch": 0.6, "learning_rate": 7.368121023896819e-06, "loss": 1.2407, "step": 21869 }, { "epoch": 0.6, "learning_rate": 7.3672677106594394e-06, "loss": 1.2859, "step": 21870 }, { "epoch": 0.6, "learning_rate": 7.366414418019312e-06, "loss": 1.2415, "step": 21871 }, { "epoch": 0.6, "learning_rate": 7.365561145983127e-06, "loss": 1.386, "step": 21872 }, { "epoch": 0.6, "learning_rate": 7.364707894557544e-06, "loss": 1.1926, "step": 21873 }, { "epoch": 0.6, "learning_rate": 7.363854663749256e-06, "loss": 1.2273, "step": 21874 }, { "epoch": 0.6, "learning_rate": 7.3630014535649216e-06, "loss": 1.3687, "step": 21875 }, { "epoch": 0.6, "learning_rate": 7.362148264011232e-06, "loss": 1.4272, "step": 21876 }, { "epoch": 0.6, "learning_rate": 7.361295095094847e-06, "loss": 1.2834, "step": 21877 }, { "epoch": 0.6, "learning_rate": 7.360441946822454e-06, "loss": 1.2886, "step": 21878 }, { "epoch": 0.6, "learning_rate": 7.3595888192007155e-06, "loss": 1.417, "step": 21879 }, { "epoch": 0.6, "learning_rate": 7.358735712236318e-06, "loss": 1.481, "step": 21880 }, { "epoch": 0.6, "learning_rate": 7.357882625935927e-06, "loss": 1.3284, "step": 21881 }, { "epoch": 0.6, "learning_rate": 7.3570295603062224e-06, "loss": 1.2522, "step": 21882 }, { "epoch": 0.6, "learning_rate": 7.356176515353873e-06, "loss": 1.2905, "step": 21883 }, { "epoch": 0.6, "learning_rate": 7.3553234910855566e-06, "loss": 1.1628, "step": 21884 }, { "epoch": 0.6, "learning_rate": 7.354470487507948e-06, "loss": 1.3423, "step": 21885 }, { "epoch": 0.6, "learning_rate": 7.353617504627715e-06, "loss": 1.3721, "step": 21886 }, { "epoch": 0.6, "learning_rate": 7.352764542451536e-06, "loss": 1.2156, "step": 21887 }, { "epoch": 0.6, "learning_rate": 7.351911600986081e-06, "loss": 1.2747, "step": 21888 }, { "epoch": 0.6, "learning_rate": 7.351058680238025e-06, "loss": 1.3413, "step": 21889 }, { "epoch": 0.6, "learning_rate": 7.35020578021404e-06, "loss": 1.2476, "step": 21890 }, { "epoch": 0.6, "learning_rate": 7.349352900920801e-06, "loss": 1.2075, "step": 21891 }, { "epoch": 0.6, "learning_rate": 7.3485000423649755e-06, "loss": 1.2324, "step": 21892 }, { "epoch": 0.6, "learning_rate": 7.347647204553241e-06, "loss": 1.1763, "step": 21893 }, { "epoch": 0.6, "learning_rate": 7.3467943874922665e-06, "loss": 1.2441, "step": 21894 }, { "epoch": 0.6, "learning_rate": 7.345941591188727e-06, "loss": 1.2778, "step": 21895 }, { "epoch": 0.6, "learning_rate": 7.34508881564929e-06, "loss": 1.1531, "step": 21896 }, { "epoch": 0.6, "learning_rate": 7.344236060880632e-06, "loss": 1.3369, "step": 21897 }, { "epoch": 0.6, "learning_rate": 7.343383326889419e-06, "loss": 1.2737, "step": 21898 }, { "epoch": 0.6, "learning_rate": 7.342530613682326e-06, "loss": 1.2305, "step": 21899 }, { "epoch": 0.6, "learning_rate": 7.341677921266026e-06, "loss": 1.1125, "step": 21900 }, { "epoch": 0.6, "learning_rate": 7.340825249647188e-06, "loss": 1.3025, "step": 21901 }, { "epoch": 0.6, "learning_rate": 7.3399725988324826e-06, "loss": 1.334, "step": 21902 }, { "epoch": 0.6, "learning_rate": 7.339119968828579e-06, "loss": 1.5908, "step": 21903 }, { "epoch": 0.6, "learning_rate": 7.338267359642151e-06, "loss": 1.2122, "step": 21904 }, { "epoch": 0.6, "learning_rate": 7.337414771279867e-06, "loss": 1.7148, "step": 21905 }, { "epoch": 0.6, "learning_rate": 7.336562203748399e-06, "loss": 1.3181, "step": 21906 }, { "epoch": 0.6, "learning_rate": 7.335709657054413e-06, "loss": 1.314, "step": 21907 }, { "epoch": 0.6, "learning_rate": 7.334857131204585e-06, "loss": 1.2361, "step": 21908 }, { "epoch": 0.6, "learning_rate": 7.33400462620558e-06, "loss": 1.4385, "step": 21909 }, { "epoch": 0.6, "learning_rate": 7.33315214206407e-06, "loss": 1.2292, "step": 21910 }, { "epoch": 0.6, "learning_rate": 7.3322996787867225e-06, "loss": 1.3438, "step": 21911 }, { "epoch": 0.6, "learning_rate": 7.331447236380209e-06, "loss": 1.0466, "step": 21912 }, { "epoch": 0.6, "learning_rate": 7.330594814851194e-06, "loss": 1.3989, "step": 21913 }, { "epoch": 0.6, "learning_rate": 7.329742414206351e-06, "loss": 1.2952, "step": 21914 }, { "epoch": 0.6, "learning_rate": 7.3288900344523515e-06, "loss": 1.241, "step": 21915 }, { "epoch": 0.6, "learning_rate": 7.328037675595858e-06, "loss": 1.2759, "step": 21916 }, { "epoch": 0.6, "learning_rate": 7.327185337643542e-06, "loss": 1.2212, "step": 21917 }, { "epoch": 0.6, "learning_rate": 7.32633302060207e-06, "loss": 1.2383, "step": 21918 }, { "epoch": 0.6, "learning_rate": 7.325480724478113e-06, "loss": 1.2661, "step": 21919 }, { "epoch": 0.6, "learning_rate": 7.3246284492783345e-06, "loss": 1.2971, "step": 21920 }, { "epoch": 0.6, "learning_rate": 7.323776195009409e-06, "loss": 1.71, "step": 21921 }, { "epoch": 0.6, "learning_rate": 7.3229239616779955e-06, "loss": 1.1543, "step": 21922 }, { "epoch": 0.6, "learning_rate": 7.322071749290769e-06, "loss": 1.2402, "step": 21923 }, { "epoch": 0.6, "learning_rate": 7.321219557854393e-06, "loss": 1.2695, "step": 21924 }, { "epoch": 0.6, "learning_rate": 7.320367387375537e-06, "loss": 1.3296, "step": 21925 }, { "epoch": 0.6, "learning_rate": 7.319515237860863e-06, "loss": 1.2556, "step": 21926 }, { "epoch": 0.6, "learning_rate": 7.318663109317046e-06, "loss": 1.2136, "step": 21927 }, { "epoch": 0.6, "learning_rate": 7.317811001750743e-06, "loss": 1.3057, "step": 21928 }, { "epoch": 0.6, "learning_rate": 7.316958915168628e-06, "loss": 1.3308, "step": 21929 }, { "epoch": 0.6, "learning_rate": 7.316106849577365e-06, "loss": 1.0881, "step": 21930 }, { "epoch": 0.6, "learning_rate": 7.31525480498362e-06, "loss": 1.3933, "step": 21931 }, { "epoch": 0.6, "learning_rate": 7.314402781394059e-06, "loss": 1.0471, "step": 21932 }, { "epoch": 0.6, "learning_rate": 7.313550778815346e-06, "loss": 1.2642, "step": 21933 }, { "epoch": 0.6, "learning_rate": 7.312698797254151e-06, "loss": 1.3425, "step": 21934 }, { "epoch": 0.6, "learning_rate": 7.311846836717135e-06, "loss": 1.2151, "step": 21935 }, { "epoch": 0.6, "learning_rate": 7.310994897210967e-06, "loss": 1.3408, "step": 21936 }, { "epoch": 0.6, "learning_rate": 7.310142978742309e-06, "loss": 1.3169, "step": 21937 }, { "epoch": 0.6, "learning_rate": 7.3092910813178286e-06, "loss": 1.1671, "step": 21938 }, { "epoch": 0.6, "learning_rate": 7.308439204944189e-06, "loss": 1.2542, "step": 21939 }, { "epoch": 0.6, "learning_rate": 7.307587349628056e-06, "loss": 1.3606, "step": 21940 }, { "epoch": 0.6, "learning_rate": 7.306735515376091e-06, "loss": 1.3105, "step": 21941 }, { "epoch": 0.6, "learning_rate": 7.305883702194964e-06, "loss": 1.2712, "step": 21942 }, { "epoch": 0.6, "learning_rate": 7.305031910091333e-06, "loss": 1.2922, "step": 21943 }, { "epoch": 0.6, "learning_rate": 7.304180139071868e-06, "loss": 1.262, "step": 21944 }, { "epoch": 0.6, "learning_rate": 7.3033283891432294e-06, "loss": 1.2644, "step": 21945 }, { "epoch": 0.6, "learning_rate": 7.302476660312077e-06, "loss": 1.3215, "step": 21946 }, { "epoch": 0.6, "learning_rate": 7.301624952585086e-06, "loss": 1.0691, "step": 21947 }, { "epoch": 0.6, "learning_rate": 7.300773265968905e-06, "loss": 1.3164, "step": 21948 }, { "epoch": 0.6, "learning_rate": 7.299921600470212e-06, "loss": 1.2966, "step": 21949 }, { "epoch": 0.6, "learning_rate": 7.299069956095657e-06, "loss": 1.3811, "step": 21950 }, { "epoch": 0.6, "learning_rate": 7.298218332851914e-06, "loss": 1.2705, "step": 21951 }, { "epoch": 0.6, "learning_rate": 7.297366730745634e-06, "loss": 1.2327, "step": 21952 }, { "epoch": 0.6, "learning_rate": 7.296515149783493e-06, "loss": 1.2371, "step": 21953 }, { "epoch": 0.6, "learning_rate": 7.295663589972139e-06, "loss": 1.1833, "step": 21954 }, { "epoch": 0.6, "learning_rate": 7.294812051318247e-06, "loss": 1.2524, "step": 21955 }, { "epoch": 0.6, "learning_rate": 7.293960533828469e-06, "loss": 1.3203, "step": 21956 }, { "epoch": 0.6, "learning_rate": 7.293109037509477e-06, "loss": 1.1594, "step": 21957 }, { "epoch": 0.6, "learning_rate": 7.29225756236792e-06, "loss": 1.2244, "step": 21958 }, { "epoch": 0.6, "learning_rate": 7.291406108410475e-06, "loss": 1.2866, "step": 21959 }, { "epoch": 0.6, "learning_rate": 7.290554675643786e-06, "loss": 1.2371, "step": 21960 }, { "epoch": 0.6, "learning_rate": 7.289703264074526e-06, "loss": 1.3164, "step": 21961 }, { "epoch": 0.6, "learning_rate": 7.288851873709355e-06, "loss": 1.2715, "step": 21962 }, { "epoch": 0.6, "learning_rate": 7.288000504554931e-06, "loss": 1.3557, "step": 21963 }, { "epoch": 0.6, "learning_rate": 7.287149156617917e-06, "loss": 1.1958, "step": 21964 }, { "epoch": 0.6, "learning_rate": 7.286297829904971e-06, "loss": 1.3088, "step": 21965 }, { "epoch": 0.6, "learning_rate": 7.285446524422757e-06, "loss": 1.3545, "step": 21966 }, { "epoch": 0.6, "learning_rate": 7.28459524017793e-06, "loss": 1.4192, "step": 21967 }, { "epoch": 0.6, "learning_rate": 7.283743977177155e-06, "loss": 1.3379, "step": 21968 }, { "epoch": 0.6, "learning_rate": 7.282892735427087e-06, "loss": 1.2214, "step": 21969 }, { "epoch": 0.6, "learning_rate": 7.282041514934393e-06, "loss": 1.3025, "step": 21970 }, { "epoch": 0.6, "learning_rate": 7.281190315705724e-06, "loss": 1.4111, "step": 21971 }, { "epoch": 0.6, "learning_rate": 7.2803391377477475e-06, "loss": 1.304, "step": 21972 }, { "epoch": 0.6, "learning_rate": 7.2794879810671145e-06, "loss": 1.2461, "step": 21973 }, { "epoch": 0.6, "learning_rate": 7.278636845670492e-06, "loss": 1.2715, "step": 21974 }, { "epoch": 0.6, "learning_rate": 7.277785731564531e-06, "loss": 1.3213, "step": 21975 }, { "epoch": 0.6, "learning_rate": 7.276934638755897e-06, "loss": 1.29, "step": 21976 }, { "epoch": 0.6, "learning_rate": 7.276083567251247e-06, "loss": 1.2341, "step": 21977 }, { "epoch": 0.6, "learning_rate": 7.275232517057236e-06, "loss": 1.1533, "step": 21978 }, { "epoch": 0.6, "learning_rate": 7.274381488180526e-06, "loss": 1.012, "step": 21979 }, { "epoch": 0.6, "learning_rate": 7.273530480627772e-06, "loss": 1.0739, "step": 21980 }, { "epoch": 0.6, "learning_rate": 7.272679494405634e-06, "loss": 1.3748, "step": 21981 }, { "epoch": 0.6, "learning_rate": 7.27182852952077e-06, "loss": 1.2773, "step": 21982 }, { "epoch": 0.6, "learning_rate": 7.270977585979837e-06, "loss": 1.2102, "step": 21983 }, { "epoch": 0.6, "learning_rate": 7.2701266637894905e-06, "loss": 1.177, "step": 21984 }, { "epoch": 0.6, "learning_rate": 7.269275762956392e-06, "loss": 1.3247, "step": 21985 }, { "epoch": 0.6, "learning_rate": 7.2684248834871925e-06, "loss": 1.04, "step": 21986 }, { "epoch": 0.6, "learning_rate": 7.267574025388555e-06, "loss": 1.2422, "step": 21987 }, { "epoch": 0.6, "learning_rate": 7.266723188667131e-06, "loss": 1.2266, "step": 21988 }, { "epoch": 0.6, "learning_rate": 7.265872373329581e-06, "loss": 1.1128, "step": 21989 }, { "epoch": 0.6, "learning_rate": 7.265021579382559e-06, "loss": 1.416, "step": 21990 }, { "epoch": 0.6, "learning_rate": 7.264170806832724e-06, "loss": 1.3169, "step": 21991 }, { "epoch": 0.6, "learning_rate": 7.263320055686728e-06, "loss": 1.2175, "step": 21992 }, { "epoch": 0.6, "learning_rate": 7.262469325951227e-06, "loss": 1.1816, "step": 21993 }, { "epoch": 0.6, "learning_rate": 7.261618617632884e-06, "loss": 1.1511, "step": 21994 }, { "epoch": 0.6, "learning_rate": 7.260767930738344e-06, "loss": 1.2998, "step": 21995 }, { "epoch": 0.6, "learning_rate": 7.259917265274274e-06, "loss": 1.301, "step": 21996 }, { "epoch": 0.6, "learning_rate": 7.259066621247316e-06, "loss": 1.2227, "step": 21997 }, { "epoch": 0.6, "learning_rate": 7.258215998664137e-06, "loss": 1.2419, "step": 21998 }, { "epoch": 0.6, "learning_rate": 7.257365397531383e-06, "loss": 1.2009, "step": 21999 }, { "epoch": 0.6, "learning_rate": 7.256514817855717e-06, "loss": 1.3835, "step": 22000 }, { "epoch": 0.6, "learning_rate": 7.255664259643784e-06, "loss": 1.1733, "step": 22001 }, { "epoch": 0.6, "learning_rate": 7.2548137229022485e-06, "loss": 1.3894, "step": 22002 }, { "epoch": 0.6, "learning_rate": 7.253963207637753e-06, "loss": 1.2383, "step": 22003 }, { "epoch": 0.6, "learning_rate": 7.253112713856966e-06, "loss": 1.1465, "step": 22004 }, { "epoch": 0.6, "learning_rate": 7.252262241566526e-06, "loss": 1.3198, "step": 22005 }, { "epoch": 0.6, "learning_rate": 7.2514117907731e-06, "loss": 1.3005, "step": 22006 }, { "epoch": 0.6, "learning_rate": 7.25056136148333e-06, "loss": 1.2947, "step": 22007 }, { "epoch": 0.6, "learning_rate": 7.249710953703876e-06, "loss": 1.3367, "step": 22008 }, { "epoch": 0.6, "learning_rate": 7.248860567441395e-06, "loss": 1.4187, "step": 22009 }, { "epoch": 0.6, "learning_rate": 7.248010202702531e-06, "loss": 1.4844, "step": 22010 }, { "epoch": 0.6, "learning_rate": 7.247159859493944e-06, "loss": 1.7051, "step": 22011 }, { "epoch": 0.6, "learning_rate": 7.246309537822282e-06, "loss": 1.1975, "step": 22012 }, { "epoch": 0.6, "learning_rate": 7.245459237694201e-06, "loss": 1.2029, "step": 22013 }, { "epoch": 0.6, "learning_rate": 7.2446089591163485e-06, "loss": 1.1619, "step": 22014 }, { "epoch": 0.6, "learning_rate": 7.243758702095382e-06, "loss": 1.3081, "step": 22015 }, { "epoch": 0.6, "learning_rate": 7.242908466637951e-06, "loss": 1.3142, "step": 22016 }, { "epoch": 0.6, "learning_rate": 7.24205825275071e-06, "loss": 1.2942, "step": 22017 }, { "epoch": 0.6, "learning_rate": 7.241208060440305e-06, "loss": 1.2559, "step": 22018 }, { "epoch": 0.6, "learning_rate": 7.240357889713392e-06, "loss": 1.0957, "step": 22019 }, { "epoch": 0.6, "learning_rate": 7.2395077405766215e-06, "loss": 1.2532, "step": 22020 }, { "epoch": 0.6, "learning_rate": 7.238657613036644e-06, "loss": 1.2224, "step": 22021 }, { "epoch": 0.6, "learning_rate": 7.23780750710011e-06, "loss": 1.0996, "step": 22022 }, { "epoch": 0.6, "learning_rate": 7.236957422773672e-06, "loss": 1.3564, "step": 22023 }, { "epoch": 0.6, "learning_rate": 7.2361073600639794e-06, "loss": 1.3584, "step": 22024 }, { "epoch": 0.6, "learning_rate": 7.235257318977684e-06, "loss": 1.1982, "step": 22025 }, { "epoch": 0.6, "learning_rate": 7.234407299521435e-06, "loss": 1.1868, "step": 22026 }, { "epoch": 0.6, "learning_rate": 7.2335573017018825e-06, "loss": 1.2041, "step": 22027 }, { "epoch": 0.6, "learning_rate": 7.232707325525678e-06, "loss": 1.2507, "step": 22028 }, { "epoch": 0.6, "learning_rate": 7.231857370999469e-06, "loss": 1.0857, "step": 22029 }, { "epoch": 0.6, "learning_rate": 7.231007438129907e-06, "loss": 1.3225, "step": 22030 }, { "epoch": 0.6, "learning_rate": 7.230157526923639e-06, "loss": 1.2329, "step": 22031 }, { "epoch": 0.6, "learning_rate": 7.2293076373873186e-06, "loss": 1.3489, "step": 22032 }, { "epoch": 0.6, "learning_rate": 7.22845776952759e-06, "loss": 1.239, "step": 22033 }, { "epoch": 0.6, "learning_rate": 7.227607923351105e-06, "loss": 1.2451, "step": 22034 }, { "epoch": 0.6, "learning_rate": 7.2267580988645126e-06, "loss": 1.2568, "step": 22035 }, { "epoch": 0.6, "learning_rate": 7.225908296074462e-06, "loss": 1.3083, "step": 22036 }, { "epoch": 0.6, "learning_rate": 7.225058514987597e-06, "loss": 1.4016, "step": 22037 }, { "epoch": 0.6, "learning_rate": 7.224208755610569e-06, "loss": 1.2788, "step": 22038 }, { "epoch": 0.6, "learning_rate": 7.223359017950031e-06, "loss": 1.1904, "step": 22039 }, { "epoch": 0.6, "learning_rate": 7.222509302012622e-06, "loss": 1.2556, "step": 22040 }, { "epoch": 0.6, "learning_rate": 7.221659607804999e-06, "loss": 1.2446, "step": 22041 }, { "epoch": 0.6, "learning_rate": 7.220809935333799e-06, "loss": 1.2065, "step": 22042 }, { "epoch": 0.6, "learning_rate": 7.219960284605682e-06, "loss": 1.2122, "step": 22043 }, { "epoch": 0.6, "learning_rate": 7.2191106556272815e-06, "loss": 1.3752, "step": 22044 }, { "epoch": 0.6, "learning_rate": 7.218261048405257e-06, "loss": 1.2642, "step": 22045 }, { "epoch": 0.6, "learning_rate": 7.217411462946246e-06, "loss": 1.4592, "step": 22046 }, { "epoch": 0.6, "learning_rate": 7.216561899256904e-06, "loss": 1.2126, "step": 22047 }, { "epoch": 0.6, "learning_rate": 7.215712357343867e-06, "loss": 1.3491, "step": 22048 }, { "epoch": 0.6, "learning_rate": 7.214862837213793e-06, "loss": 1.1831, "step": 22049 }, { "epoch": 0.6, "learning_rate": 7.214013338873316e-06, "loss": 1.2527, "step": 22050 }, { "epoch": 0.6, "learning_rate": 7.213163862329095e-06, "loss": 1.3557, "step": 22051 }, { "epoch": 0.6, "learning_rate": 7.212314407587764e-06, "loss": 1.2983, "step": 22052 }, { "epoch": 0.6, "learning_rate": 7.211464974655981e-06, "loss": 1.2021, "step": 22053 }, { "epoch": 0.6, "learning_rate": 7.210615563540377e-06, "loss": 1.479, "step": 22054 }, { "epoch": 0.6, "learning_rate": 7.2097661742476075e-06, "loss": 1.2412, "step": 22055 }, { "epoch": 0.6, "learning_rate": 7.2089168067843185e-06, "loss": 1.2537, "step": 22056 }, { "epoch": 0.6, "learning_rate": 7.208067461157148e-06, "loss": 1.3403, "step": 22057 }, { "epoch": 0.6, "learning_rate": 7.207218137372749e-06, "loss": 1.2998, "step": 22058 }, { "epoch": 0.6, "learning_rate": 7.206368835437758e-06, "loss": 1.48, "step": 22059 }, { "epoch": 0.6, "learning_rate": 7.2055195553588275e-06, "loss": 1.2771, "step": 22060 }, { "epoch": 0.6, "learning_rate": 7.204670297142595e-06, "loss": 1.3293, "step": 22061 }, { "epoch": 0.6, "learning_rate": 7.2038210607957105e-06, "loss": 1.2285, "step": 22062 }, { "epoch": 0.6, "learning_rate": 7.202971846324811e-06, "loss": 1.3735, "step": 22063 }, { "epoch": 0.6, "learning_rate": 7.2021226537365485e-06, "loss": 1.4695, "step": 22064 }, { "epoch": 0.6, "learning_rate": 7.2012734830375604e-06, "loss": 1.4028, "step": 22065 }, { "epoch": 0.6, "learning_rate": 7.2004243342344935e-06, "loss": 1.4224, "step": 22066 }, { "epoch": 0.6, "learning_rate": 7.1995752073339885e-06, "loss": 1.3523, "step": 22067 }, { "epoch": 0.6, "learning_rate": 7.198726102342694e-06, "loss": 1.2937, "step": 22068 }, { "epoch": 0.6, "learning_rate": 7.1978770192672456e-06, "loss": 1.2402, "step": 22069 }, { "epoch": 0.6, "learning_rate": 7.197027958114289e-06, "loss": 1.1516, "step": 22070 }, { "epoch": 0.6, "learning_rate": 7.196178918890471e-06, "loss": 1.2681, "step": 22071 }, { "epoch": 0.6, "learning_rate": 7.195329901602428e-06, "loss": 1.2131, "step": 22072 }, { "epoch": 0.6, "learning_rate": 7.194480906256808e-06, "loss": 1.2959, "step": 22073 }, { "epoch": 0.6, "learning_rate": 7.193631932860248e-06, "loss": 1.2124, "step": 22074 }, { "epoch": 0.6, "learning_rate": 7.192782981419393e-06, "loss": 1.3267, "step": 22075 }, { "epoch": 0.6, "learning_rate": 7.191934051940882e-06, "loss": 1.3196, "step": 22076 }, { "epoch": 0.6, "learning_rate": 7.191085144431361e-06, "loss": 1.3721, "step": 22077 }, { "epoch": 0.6, "learning_rate": 7.190236258897467e-06, "loss": 1.2449, "step": 22078 }, { "epoch": 0.6, "learning_rate": 7.189387395345846e-06, "loss": 1.2229, "step": 22079 }, { "epoch": 0.6, "learning_rate": 7.188538553783133e-06, "loss": 1.2222, "step": 22080 }, { "epoch": 0.6, "learning_rate": 7.187689734215975e-06, "loss": 1.3032, "step": 22081 }, { "epoch": 0.6, "learning_rate": 7.186840936651007e-06, "loss": 1.145, "step": 22082 }, { "epoch": 0.6, "learning_rate": 7.185992161094877e-06, "loss": 1.375, "step": 22083 }, { "epoch": 0.6, "learning_rate": 7.185143407554217e-06, "loss": 1.2485, "step": 22084 }, { "epoch": 0.6, "learning_rate": 7.18429467603567e-06, "loss": 1.0554, "step": 22085 }, { "epoch": 0.6, "learning_rate": 7.183445966545884e-06, "loss": 1.7212, "step": 22086 }, { "epoch": 0.6, "learning_rate": 7.182597279091485e-06, "loss": 1.2188, "step": 22087 }, { "epoch": 0.6, "learning_rate": 7.181748613679127e-06, "loss": 1.2269, "step": 22088 }, { "epoch": 0.6, "learning_rate": 7.180899970315437e-06, "loss": 1.3552, "step": 22089 }, { "epoch": 0.6, "learning_rate": 7.180051349007066e-06, "loss": 1.2754, "step": 22090 }, { "epoch": 0.6, "learning_rate": 7.17920274976064e-06, "loss": 1.3062, "step": 22091 }, { "epoch": 0.6, "learning_rate": 7.178354172582812e-06, "loss": 1.2407, "step": 22092 }, { "epoch": 0.6, "learning_rate": 7.177505617480207e-06, "loss": 1.2732, "step": 22093 }, { "epoch": 0.6, "learning_rate": 7.17665708445948e-06, "loss": 1.2822, "step": 22094 }, { "epoch": 0.6, "learning_rate": 7.1758085735272505e-06, "loss": 1.2915, "step": 22095 }, { "epoch": 0.6, "learning_rate": 7.174960084690175e-06, "loss": 1.1807, "step": 22096 }, { "epoch": 0.6, "learning_rate": 7.174111617954878e-06, "loss": 1.2822, "step": 22097 }, { "epoch": 0.6, "learning_rate": 7.1732631733280064e-06, "loss": 1.3413, "step": 22098 }, { "epoch": 0.6, "learning_rate": 7.1724147508161904e-06, "loss": 1.2729, "step": 22099 }, { "epoch": 0.6, "learning_rate": 7.171566350426072e-06, "loss": 1.2974, "step": 22100 }, { "epoch": 0.6, "learning_rate": 7.1707179721642916e-06, "loss": 1.6587, "step": 22101 }, { "epoch": 0.6, "learning_rate": 7.169869616037482e-06, "loss": 1.3049, "step": 22102 }, { "epoch": 0.6, "learning_rate": 7.169021282052283e-06, "loss": 1.1753, "step": 22103 }, { "epoch": 0.6, "learning_rate": 7.168172970215328e-06, "loss": 1.4307, "step": 22104 }, { "epoch": 0.6, "learning_rate": 7.167324680533259e-06, "loss": 1.229, "step": 22105 }, { "epoch": 0.6, "learning_rate": 7.166476413012706e-06, "loss": 1.2219, "step": 22106 }, { "epoch": 0.6, "learning_rate": 7.165628167660312e-06, "loss": 1.1506, "step": 22107 }, { "epoch": 0.6, "learning_rate": 7.164779944482709e-06, "loss": 1.2412, "step": 22108 }, { "epoch": 0.6, "learning_rate": 7.163931743486536e-06, "loss": 1.385, "step": 22109 }, { "epoch": 0.6, "learning_rate": 7.163083564678426e-06, "loss": 1.2622, "step": 22110 }, { "epoch": 0.6, "learning_rate": 7.162235408065018e-06, "loss": 1.2969, "step": 22111 }, { "epoch": 0.6, "learning_rate": 7.1613872736529434e-06, "loss": 1.4277, "step": 22112 }, { "epoch": 0.6, "learning_rate": 7.160539161448843e-06, "loss": 1.4028, "step": 22113 }, { "epoch": 0.6, "learning_rate": 7.159691071459345e-06, "loss": 1.2444, "step": 22114 }, { "epoch": 0.6, "learning_rate": 7.158843003691092e-06, "loss": 1.0903, "step": 22115 }, { "epoch": 0.6, "learning_rate": 7.157994958150712e-06, "loss": 1.2866, "step": 22116 }, { "epoch": 0.6, "learning_rate": 7.157146934844844e-06, "loss": 1.3674, "step": 22117 }, { "epoch": 0.6, "learning_rate": 7.156298933780124e-06, "loss": 1.2429, "step": 22118 }, { "epoch": 0.6, "learning_rate": 7.155450954963182e-06, "loss": 1.249, "step": 22119 }, { "epoch": 0.6, "learning_rate": 7.154602998400655e-06, "loss": 1.2515, "step": 22120 }, { "epoch": 0.6, "learning_rate": 7.1537550640991745e-06, "loss": 1.2815, "step": 22121 }, { "epoch": 0.6, "learning_rate": 7.1529071520653785e-06, "loss": 1.4937, "step": 22122 }, { "epoch": 0.6, "learning_rate": 7.152059262305895e-06, "loss": 1.3223, "step": 22123 }, { "epoch": 0.6, "learning_rate": 7.151211394827364e-06, "loss": 1.2759, "step": 22124 }, { "epoch": 0.6, "learning_rate": 7.150363549636412e-06, "loss": 1.3308, "step": 22125 }, { "epoch": 0.6, "learning_rate": 7.149515726739679e-06, "loss": 1.1663, "step": 22126 }, { "epoch": 0.6, "learning_rate": 7.148667926143792e-06, "loss": 1.334, "step": 22127 }, { "epoch": 0.6, "learning_rate": 7.147820147855389e-06, "loss": 1.136, "step": 22128 }, { "epoch": 0.6, "learning_rate": 7.146972391881096e-06, "loss": 1.1304, "step": 22129 }, { "epoch": 0.6, "learning_rate": 7.146124658227553e-06, "loss": 1.3386, "step": 22130 }, { "epoch": 0.6, "learning_rate": 7.145276946901387e-06, "loss": 1.3071, "step": 22131 }, { "epoch": 0.6, "learning_rate": 7.144429257909229e-06, "loss": 1.3167, "step": 22132 }, { "epoch": 0.6, "learning_rate": 7.14358159125772e-06, "loss": 1.2981, "step": 22133 }, { "epoch": 0.6, "learning_rate": 7.14273394695348e-06, "loss": 1.2175, "step": 22134 }, { "epoch": 0.6, "learning_rate": 7.141886325003151e-06, "loss": 1.427, "step": 22135 }, { "epoch": 0.6, "learning_rate": 7.141038725413354e-06, "loss": 1.1191, "step": 22136 }, { "epoch": 0.6, "learning_rate": 7.140191148190732e-06, "loss": 1.2036, "step": 22137 }, { "epoch": 0.6, "learning_rate": 7.139343593341902e-06, "loss": 1.4551, "step": 22138 }, { "epoch": 0.6, "learning_rate": 7.1384960608735095e-06, "loss": 1.2068, "step": 22139 }, { "epoch": 0.6, "learning_rate": 7.1376485507921725e-06, "loss": 1.269, "step": 22140 }, { "epoch": 0.6, "learning_rate": 7.1368010631045325e-06, "loss": 1.2617, "step": 22141 }, { "epoch": 0.6, "learning_rate": 7.135953597817209e-06, "loss": 1.1947, "step": 22142 }, { "epoch": 0.6, "learning_rate": 7.135106154936843e-06, "loss": 1.3276, "step": 22143 }, { "epoch": 0.6, "learning_rate": 7.134258734470057e-06, "loss": 1.1272, "step": 22144 }, { "epoch": 0.6, "learning_rate": 7.133411336423483e-06, "loss": 1.3503, "step": 22145 }, { "epoch": 0.6, "learning_rate": 7.132563960803751e-06, "loss": 1.3342, "step": 22146 }, { "epoch": 0.6, "learning_rate": 7.131716607617489e-06, "loss": 1.2568, "step": 22147 }, { "epoch": 0.6, "learning_rate": 7.130869276871331e-06, "loss": 1.3701, "step": 22148 }, { "epoch": 0.6, "learning_rate": 7.130021968571898e-06, "loss": 1.3909, "step": 22149 }, { "epoch": 0.6, "learning_rate": 7.129174682725828e-06, "loss": 1.2837, "step": 22150 }, { "epoch": 0.6, "learning_rate": 7.128327419339742e-06, "loss": 1.3125, "step": 22151 }, { "epoch": 0.6, "learning_rate": 7.127480178420274e-06, "loss": 1.2166, "step": 22152 }, { "epoch": 0.6, "learning_rate": 7.126632959974049e-06, "loss": 1.4316, "step": 22153 }, { "epoch": 0.61, "learning_rate": 7.125785764007698e-06, "loss": 1.2507, "step": 22154 }, { "epoch": 0.61, "learning_rate": 7.124938590527845e-06, "loss": 1.2688, "step": 22155 }, { "epoch": 0.61, "learning_rate": 7.1240914395411245e-06, "loss": 1.312, "step": 22156 }, { "epoch": 0.61, "learning_rate": 7.123244311054157e-06, "loss": 1.3547, "step": 22157 }, { "epoch": 0.61, "learning_rate": 7.1223972050735755e-06, "loss": 1.3855, "step": 22158 }, { "epoch": 0.61, "learning_rate": 7.1215501216060025e-06, "loss": 1.3657, "step": 22159 }, { "epoch": 0.61, "learning_rate": 7.120703060658071e-06, "loss": 1.3174, "step": 22160 }, { "epoch": 0.61, "learning_rate": 7.119856022236402e-06, "loss": 1.1731, "step": 22161 }, { "epoch": 0.61, "learning_rate": 7.119009006347625e-06, "loss": 1.2737, "step": 22162 }, { "epoch": 0.61, "learning_rate": 7.118162012998369e-06, "loss": 1.3606, "step": 22163 }, { "epoch": 0.61, "learning_rate": 7.117315042195256e-06, "loss": 1.2986, "step": 22164 }, { "epoch": 0.61, "learning_rate": 7.1164680939449175e-06, "loss": 1.1646, "step": 22165 }, { "epoch": 0.61, "learning_rate": 7.115621168253974e-06, "loss": 1.3147, "step": 22166 }, { "epoch": 0.61, "learning_rate": 7.114774265129057e-06, "loss": 1.2341, "step": 22167 }, { "epoch": 0.61, "learning_rate": 7.113927384576786e-06, "loss": 1.3867, "step": 22168 }, { "epoch": 0.61, "learning_rate": 7.113080526603793e-06, "loss": 1.135, "step": 22169 }, { "epoch": 0.61, "learning_rate": 7.112233691216697e-06, "loss": 1.2769, "step": 22170 }, { "epoch": 0.61, "learning_rate": 7.111386878422131e-06, "loss": 1.2966, "step": 22171 }, { "epoch": 0.61, "learning_rate": 7.1105400882267114e-06, "loss": 1.1052, "step": 22172 }, { "epoch": 0.61, "learning_rate": 7.1096933206370715e-06, "loss": 1.2317, "step": 22173 }, { "epoch": 0.61, "learning_rate": 7.108846575659829e-06, "loss": 1.4373, "step": 22174 }, { "epoch": 0.61, "learning_rate": 7.107999853301613e-06, "loss": 1.7578, "step": 22175 }, { "epoch": 0.61, "learning_rate": 7.107153153569042e-06, "loss": 1.3, "step": 22176 }, { "epoch": 0.61, "learning_rate": 7.106306476468752e-06, "loss": 1.231, "step": 22177 }, { "epoch": 0.61, "learning_rate": 7.105459822007352e-06, "loss": 1.2251, "step": 22178 }, { "epoch": 0.61, "learning_rate": 7.104613190191476e-06, "loss": 1.3896, "step": 22179 }, { "epoch": 0.61, "learning_rate": 7.1037665810277465e-06, "loss": 1.1125, "step": 22180 }, { "epoch": 0.61, "learning_rate": 7.102919994522783e-06, "loss": 1.3579, "step": 22181 }, { "epoch": 0.61, "learning_rate": 7.102073430683214e-06, "loss": 1.3157, "step": 22182 }, { "epoch": 0.61, "learning_rate": 7.101226889515657e-06, "loss": 1.377, "step": 22183 }, { "epoch": 0.61, "learning_rate": 7.100380371026741e-06, "loss": 1.3174, "step": 22184 }, { "epoch": 0.61, "learning_rate": 7.099533875223081e-06, "loss": 1.1338, "step": 22185 }, { "epoch": 0.61, "learning_rate": 7.098687402111309e-06, "loss": 1.1578, "step": 22186 }, { "epoch": 0.61, "learning_rate": 7.097840951698038e-06, "loss": 1.2505, "step": 22187 }, { "epoch": 0.61, "learning_rate": 7.0969945239898975e-06, "loss": 1.176, "step": 22188 }, { "epoch": 0.61, "learning_rate": 7.096148118993505e-06, "loss": 1.2019, "step": 22189 }, { "epoch": 0.61, "learning_rate": 7.095301736715488e-06, "loss": 1.3716, "step": 22190 }, { "epoch": 0.61, "learning_rate": 7.094455377162459e-06, "loss": 1.1736, "step": 22191 }, { "epoch": 0.61, "learning_rate": 7.093609040341049e-06, "loss": 1.318, "step": 22192 }, { "epoch": 0.61, "learning_rate": 7.092762726257872e-06, "loss": 1.2363, "step": 22193 }, { "epoch": 0.61, "learning_rate": 7.091916434919553e-06, "loss": 1.2695, "step": 22194 }, { "epoch": 0.61, "learning_rate": 7.091070166332714e-06, "loss": 1.24, "step": 22195 }, { "epoch": 0.61, "learning_rate": 7.0902239205039734e-06, "loss": 1.2468, "step": 22196 }, { "epoch": 0.61, "learning_rate": 7.089377697439953e-06, "loss": 1.0645, "step": 22197 }, { "epoch": 0.61, "learning_rate": 7.0885314971472704e-06, "loss": 1.1482, "step": 22198 }, { "epoch": 0.61, "learning_rate": 7.087685319632552e-06, "loss": 1.1934, "step": 22199 }, { "epoch": 0.61, "learning_rate": 7.086839164902413e-06, "loss": 1.8506, "step": 22200 }, { "epoch": 0.61, "learning_rate": 7.085993032963474e-06, "loss": 1.2292, "step": 22201 }, { "epoch": 0.61, "learning_rate": 7.085146923822355e-06, "loss": 1.2966, "step": 22202 }, { "epoch": 0.61, "learning_rate": 7.084300837485676e-06, "loss": 1.3599, "step": 22203 }, { "epoch": 0.61, "learning_rate": 7.083454773960055e-06, "loss": 1.3542, "step": 22204 }, { "epoch": 0.61, "learning_rate": 7.082608733252115e-06, "loss": 1.3433, "step": 22205 }, { "epoch": 0.61, "learning_rate": 7.0817627153684696e-06, "loss": 1.2881, "step": 22206 }, { "epoch": 0.61, "learning_rate": 7.080916720315743e-06, "loss": 1.3286, "step": 22207 }, { "epoch": 0.61, "learning_rate": 7.080070748100549e-06, "loss": 1.4619, "step": 22208 }, { "epoch": 0.61, "learning_rate": 7.079224798729507e-06, "loss": 1.2451, "step": 22209 }, { "epoch": 0.61, "learning_rate": 7.078378872209243e-06, "loss": 1.3687, "step": 22210 }, { "epoch": 0.61, "learning_rate": 7.077532968546361e-06, "loss": 1.376, "step": 22211 }, { "epoch": 0.61, "learning_rate": 7.076687087747496e-06, "loss": 1.3662, "step": 22212 }, { "epoch": 0.61, "learning_rate": 7.075841229819247e-06, "loss": 1.4128, "step": 22213 }, { "epoch": 0.61, "learning_rate": 7.07499539476825e-06, "loss": 1.3025, "step": 22214 }, { "epoch": 0.61, "learning_rate": 7.0741495826011065e-06, "loss": 1.4199, "step": 22215 }, { "epoch": 0.61, "learning_rate": 7.073303793324446e-06, "loss": 1.0854, "step": 22216 }, { "epoch": 0.61, "learning_rate": 7.072458026944875e-06, "loss": 1.2444, "step": 22217 }, { "epoch": 0.61, "learning_rate": 7.0716122834690224e-06, "loss": 1.2947, "step": 22218 }, { "epoch": 0.61, "learning_rate": 7.070766562903492e-06, "loss": 1.1704, "step": 22219 }, { "epoch": 0.61, "learning_rate": 7.0699208652549125e-06, "loss": 1.6851, "step": 22220 }, { "epoch": 0.61, "learning_rate": 7.069075190529888e-06, "loss": 1.2493, "step": 22221 }, { "epoch": 0.61, "learning_rate": 7.068229538735047e-06, "loss": 1.118, "step": 22222 }, { "epoch": 0.61, "learning_rate": 7.067383909876994e-06, "loss": 1.2131, "step": 22223 }, { "epoch": 0.61, "learning_rate": 7.066538303962351e-06, "loss": 1.7485, "step": 22224 }, { "epoch": 0.61, "learning_rate": 7.065692720997737e-06, "loss": 1.2632, "step": 22225 }, { "epoch": 0.61, "learning_rate": 7.064847160989759e-06, "loss": 1.3259, "step": 22226 }, { "epoch": 0.61, "learning_rate": 7.064001623945041e-06, "loss": 1.2136, "step": 22227 }, { "epoch": 0.61, "learning_rate": 7.06315610987019e-06, "loss": 1.4075, "step": 22228 }, { "epoch": 0.61, "learning_rate": 7.062310618771827e-06, "loss": 1.3542, "step": 22229 }, { "epoch": 0.61, "learning_rate": 7.061465150656562e-06, "loss": 1.1672, "step": 22230 }, { "epoch": 0.61, "learning_rate": 7.0606197055310156e-06, "loss": 1.4631, "step": 22231 }, { "epoch": 0.61, "learning_rate": 7.059774283401795e-06, "loss": 1.3135, "step": 22232 }, { "epoch": 0.61, "learning_rate": 7.05892888427552e-06, "loss": 1.4526, "step": 22233 }, { "epoch": 0.61, "learning_rate": 7.058083508158799e-06, "loss": 1.2126, "step": 22234 }, { "epoch": 0.61, "learning_rate": 7.0572381550582526e-06, "loss": 1.26, "step": 22235 }, { "epoch": 0.61, "learning_rate": 7.056392824980489e-06, "loss": 1.2292, "step": 22236 }, { "epoch": 0.61, "learning_rate": 7.055547517932127e-06, "loss": 1.3508, "step": 22237 }, { "epoch": 0.61, "learning_rate": 7.054702233919772e-06, "loss": 1.4705, "step": 22238 }, { "epoch": 0.61, "learning_rate": 7.053856972950046e-06, "loss": 1.3755, "step": 22239 }, { "epoch": 0.61, "learning_rate": 7.0530117350295555e-06, "loss": 1.2947, "step": 22240 }, { "epoch": 0.61, "learning_rate": 7.052166520164914e-06, "loss": 1.1951, "step": 22241 }, { "epoch": 0.61, "learning_rate": 7.051321328362739e-06, "loss": 1.1482, "step": 22242 }, { "epoch": 0.61, "learning_rate": 7.050476159629635e-06, "loss": 1.2549, "step": 22243 }, { "epoch": 0.61, "learning_rate": 7.0496310139722235e-06, "loss": 1.3694, "step": 22244 }, { "epoch": 0.61, "learning_rate": 7.048785891397108e-06, "loss": 1.3003, "step": 22245 }, { "epoch": 0.61, "learning_rate": 7.047940791910907e-06, "loss": 1.2434, "step": 22246 }, { "epoch": 0.61, "learning_rate": 7.047095715520226e-06, "loss": 1.4673, "step": 22247 }, { "epoch": 0.61, "learning_rate": 7.046250662231682e-06, "loss": 1.1411, "step": 22248 }, { "epoch": 0.61, "learning_rate": 7.04540563205188e-06, "loss": 1.0994, "step": 22249 }, { "epoch": 0.61, "learning_rate": 7.04456062498744e-06, "loss": 1.2839, "step": 22250 }, { "epoch": 0.61, "learning_rate": 7.043715641044965e-06, "loss": 1.3376, "step": 22251 }, { "epoch": 0.61, "learning_rate": 7.04287068023107e-06, "loss": 1.2332, "step": 22252 }, { "epoch": 0.61, "learning_rate": 7.042025742552363e-06, "loss": 1.1355, "step": 22253 }, { "epoch": 0.61, "learning_rate": 7.041180828015457e-06, "loss": 1.3625, "step": 22254 }, { "epoch": 0.61, "learning_rate": 7.040335936626959e-06, "loss": 1.3757, "step": 22255 }, { "epoch": 0.61, "learning_rate": 7.0394910683934785e-06, "loss": 1.2456, "step": 22256 }, { "epoch": 0.61, "learning_rate": 7.038646223321635e-06, "loss": 1.3242, "step": 22257 }, { "epoch": 0.61, "learning_rate": 7.037801401418024e-06, "loss": 1.3005, "step": 22258 }, { "epoch": 0.61, "learning_rate": 7.0369566026892684e-06, "loss": 1.2888, "step": 22259 }, { "epoch": 0.61, "learning_rate": 7.0361118271419645e-06, "loss": 1.1858, "step": 22260 }, { "epoch": 0.61, "learning_rate": 7.035267074782735e-06, "loss": 1.3062, "step": 22261 }, { "epoch": 0.61, "learning_rate": 7.034422345618174e-06, "loss": 1.3875, "step": 22262 }, { "epoch": 0.61, "learning_rate": 7.033577639654905e-06, "loss": 1.1554, "step": 22263 }, { "epoch": 0.61, "learning_rate": 7.032732956899524e-06, "loss": 1.2749, "step": 22264 }, { "epoch": 0.61, "learning_rate": 7.031888297358651e-06, "loss": 1.1616, "step": 22265 }, { "epoch": 0.61, "learning_rate": 7.031043661038881e-06, "loss": 1.3325, "step": 22266 }, { "epoch": 0.61, "learning_rate": 7.030199047946838e-06, "loss": 1.2866, "step": 22267 }, { "epoch": 0.61, "learning_rate": 7.029354458089112e-06, "loss": 1.2908, "step": 22268 }, { "epoch": 0.61, "learning_rate": 7.028509891472327e-06, "loss": 1.3101, "step": 22269 }, { "epoch": 0.61, "learning_rate": 7.027665348103078e-06, "loss": 1.2444, "step": 22270 }, { "epoch": 0.61, "learning_rate": 7.026820827987979e-06, "loss": 1.3127, "step": 22271 }, { "epoch": 0.61, "learning_rate": 7.025976331133637e-06, "loss": 1.3486, "step": 22272 }, { "epoch": 0.61, "learning_rate": 7.025131857546656e-06, "loss": 1.3682, "step": 22273 }, { "epoch": 0.61, "learning_rate": 7.024287407233648e-06, "loss": 1.2573, "step": 22274 }, { "epoch": 0.61, "learning_rate": 7.0234429802012135e-06, "loss": 1.3088, "step": 22275 }, { "epoch": 0.61, "learning_rate": 7.022598576455963e-06, "loss": 1.2329, "step": 22276 }, { "epoch": 0.61, "learning_rate": 7.0217541960045e-06, "loss": 1.2954, "step": 22277 }, { "epoch": 0.61, "learning_rate": 7.020909838853433e-06, "loss": 1.2129, "step": 22278 }, { "epoch": 0.61, "learning_rate": 7.0200655050093636e-06, "loss": 1.001, "step": 22279 }, { "epoch": 0.61, "learning_rate": 7.019221194478903e-06, "loss": 1.3687, "step": 22280 }, { "epoch": 0.61, "learning_rate": 7.018376907268653e-06, "loss": 1.2412, "step": 22281 }, { "epoch": 0.61, "learning_rate": 7.0175326433852205e-06, "loss": 1.3274, "step": 22282 }, { "epoch": 0.61, "learning_rate": 7.01668840283521e-06, "loss": 1.3318, "step": 22283 }, { "epoch": 0.61, "learning_rate": 7.015844185625227e-06, "loss": 1.3606, "step": 22284 }, { "epoch": 0.61, "learning_rate": 7.014999991761875e-06, "loss": 1.2971, "step": 22285 }, { "epoch": 0.61, "learning_rate": 7.014155821251759e-06, "loss": 1.3318, "step": 22286 }, { "epoch": 0.61, "learning_rate": 7.0133116741014864e-06, "loss": 1.3127, "step": 22287 }, { "epoch": 0.61, "learning_rate": 7.012467550317656e-06, "loss": 1.2446, "step": 22288 }, { "epoch": 0.61, "learning_rate": 7.011623449906877e-06, "loss": 1.2917, "step": 22289 }, { "epoch": 0.61, "learning_rate": 7.010779372875748e-06, "loss": 1.3459, "step": 22290 }, { "epoch": 0.61, "learning_rate": 7.009935319230879e-06, "loss": 1.3555, "step": 22291 }, { "epoch": 0.61, "learning_rate": 7.009091288978866e-06, "loss": 1.2686, "step": 22292 }, { "epoch": 0.61, "learning_rate": 7.00824728212632e-06, "loss": 1.261, "step": 22293 }, { "epoch": 0.61, "learning_rate": 7.007403298679838e-06, "loss": 1.083, "step": 22294 }, { "epoch": 0.61, "learning_rate": 7.006559338646028e-06, "loss": 1.6885, "step": 22295 }, { "epoch": 0.61, "learning_rate": 7.005715402031488e-06, "loss": 1.3892, "step": 22296 }, { "epoch": 0.61, "learning_rate": 7.004871488842824e-06, "loss": 1.2786, "step": 22297 }, { "epoch": 0.61, "learning_rate": 7.004027599086635e-06, "loss": 1.3145, "step": 22298 }, { "epoch": 0.61, "learning_rate": 7.003183732769528e-06, "loss": 1.3267, "step": 22299 }, { "epoch": 0.61, "learning_rate": 7.0023398898981e-06, "loss": 1.252, "step": 22300 }, { "epoch": 0.61, "learning_rate": 7.001496070478957e-06, "loss": 1.3091, "step": 22301 }, { "epoch": 0.61, "learning_rate": 7.000652274518696e-06, "loss": 1.4229, "step": 22302 }, { "epoch": 0.61, "learning_rate": 6.999808502023919e-06, "loss": 1.2532, "step": 22303 }, { "epoch": 0.61, "learning_rate": 6.998964753001237e-06, "loss": 1.2869, "step": 22304 }, { "epoch": 0.61, "learning_rate": 6.998121027457238e-06, "loss": 1.1907, "step": 22305 }, { "epoch": 0.61, "learning_rate": 6.997277325398533e-06, "loss": 1.373, "step": 22306 }, { "epoch": 0.61, "learning_rate": 6.996433646831713e-06, "loss": 1.3174, "step": 22307 }, { "epoch": 0.61, "learning_rate": 6.9955899917633895e-06, "loss": 1.373, "step": 22308 }, { "epoch": 0.61, "learning_rate": 6.994746360200151e-06, "loss": 1.3569, "step": 22309 }, { "epoch": 0.61, "learning_rate": 6.993902752148609e-06, "loss": 1.3743, "step": 22310 }, { "epoch": 0.61, "learning_rate": 6.993059167615354e-06, "loss": 1.2866, "step": 22311 }, { "epoch": 0.61, "learning_rate": 6.9922156066069955e-06, "loss": 1.4116, "step": 22312 }, { "epoch": 0.61, "learning_rate": 6.991372069130121e-06, "loss": 1.2563, "step": 22313 }, { "epoch": 0.61, "learning_rate": 6.990528555191344e-06, "loss": 1.3132, "step": 22314 }, { "epoch": 0.61, "learning_rate": 6.989685064797249e-06, "loss": 1.4229, "step": 22315 }, { "epoch": 0.61, "learning_rate": 6.98884159795445e-06, "loss": 1.2651, "step": 22316 }, { "epoch": 0.61, "learning_rate": 6.987998154669531e-06, "loss": 1.3137, "step": 22317 }, { "epoch": 0.61, "learning_rate": 6.9871547349491005e-06, "loss": 1.1794, "step": 22318 }, { "epoch": 0.61, "learning_rate": 6.986311338799757e-06, "loss": 1.3022, "step": 22319 }, { "epoch": 0.61, "learning_rate": 6.9854679662280945e-06, "loss": 1.3816, "step": 22320 }, { "epoch": 0.61, "learning_rate": 6.984624617240714e-06, "loss": 1.1143, "step": 22321 }, { "epoch": 0.61, "learning_rate": 6.9837812918442114e-06, "loss": 1.2759, "step": 22322 }, { "epoch": 0.61, "learning_rate": 6.982937990045189e-06, "loss": 1.4746, "step": 22323 }, { "epoch": 0.61, "learning_rate": 6.982094711850237e-06, "loss": 1.3086, "step": 22324 }, { "epoch": 0.61, "learning_rate": 6.98125145726596e-06, "loss": 1.2161, "step": 22325 }, { "epoch": 0.61, "learning_rate": 6.980408226298949e-06, "loss": 1.3467, "step": 22326 }, { "epoch": 0.61, "learning_rate": 6.979565018955807e-06, "loss": 1.3196, "step": 22327 }, { "epoch": 0.61, "learning_rate": 6.978721835243125e-06, "loss": 1.4038, "step": 22328 }, { "epoch": 0.61, "learning_rate": 6.977878675167506e-06, "loss": 1.2202, "step": 22329 }, { "epoch": 0.61, "learning_rate": 6.977035538735541e-06, "loss": 1.2747, "step": 22330 }, { "epoch": 0.61, "learning_rate": 6.9761924259538296e-06, "loss": 1.2478, "step": 22331 }, { "epoch": 0.61, "learning_rate": 6.975349336828965e-06, "loss": 1.1868, "step": 22332 }, { "epoch": 0.61, "learning_rate": 6.974506271367545e-06, "loss": 1.2563, "step": 22333 }, { "epoch": 0.61, "learning_rate": 6.973663229576167e-06, "loss": 1.2366, "step": 22334 }, { "epoch": 0.61, "learning_rate": 6.972820211461424e-06, "loss": 1.1936, "step": 22335 }, { "epoch": 0.61, "learning_rate": 6.971977217029912e-06, "loss": 1.3333, "step": 22336 }, { "epoch": 0.61, "learning_rate": 6.971134246288227e-06, "loss": 1.2571, "step": 22337 }, { "epoch": 0.61, "learning_rate": 6.970291299242964e-06, "loss": 1.1323, "step": 22338 }, { "epoch": 0.61, "learning_rate": 6.969448375900715e-06, "loss": 1.1849, "step": 22339 }, { "epoch": 0.61, "learning_rate": 6.968605476268079e-06, "loss": 1.4551, "step": 22340 }, { "epoch": 0.61, "learning_rate": 6.967762600351646e-06, "loss": 1.4885, "step": 22341 }, { "epoch": 0.61, "learning_rate": 6.966919748158015e-06, "loss": 1.3032, "step": 22342 }, { "epoch": 0.61, "learning_rate": 6.966076919693776e-06, "loss": 1.7056, "step": 22343 }, { "epoch": 0.61, "learning_rate": 6.965234114965527e-06, "loss": 1.2891, "step": 22344 }, { "epoch": 0.61, "learning_rate": 6.964391333979855e-06, "loss": 1.1421, "step": 22345 }, { "epoch": 0.61, "learning_rate": 6.9635485767433616e-06, "loss": 1.248, "step": 22346 }, { "epoch": 0.61, "learning_rate": 6.962705843262634e-06, "loss": 1.166, "step": 22347 }, { "epoch": 0.61, "learning_rate": 6.961863133544265e-06, "loss": 1.2703, "step": 22348 }, { "epoch": 0.61, "learning_rate": 6.961020447594857e-06, "loss": 1.1213, "step": 22349 }, { "epoch": 0.61, "learning_rate": 6.96017778542099e-06, "loss": 1.2026, "step": 22350 }, { "epoch": 0.61, "learning_rate": 6.959335147029267e-06, "loss": 1.3984, "step": 22351 }, { "epoch": 0.61, "learning_rate": 6.958492532426271e-06, "loss": 1.3022, "step": 22352 }, { "epoch": 0.61, "learning_rate": 6.957649941618606e-06, "loss": 1.126, "step": 22353 }, { "epoch": 0.61, "learning_rate": 6.95680737461285e-06, "loss": 1.4353, "step": 22354 }, { "epoch": 0.61, "learning_rate": 6.955964831415609e-06, "loss": 1.2, "step": 22355 }, { "epoch": 0.61, "learning_rate": 6.955122312033462e-06, "loss": 1.3369, "step": 22356 }, { "epoch": 0.61, "learning_rate": 6.954279816473012e-06, "loss": 1.2598, "step": 22357 }, { "epoch": 0.61, "learning_rate": 6.953437344740839e-06, "loss": 1.2964, "step": 22358 }, { "epoch": 0.61, "learning_rate": 6.952594896843544e-06, "loss": 1.2466, "step": 22359 }, { "epoch": 0.61, "learning_rate": 6.951752472787708e-06, "loss": 1.2576, "step": 22360 }, { "epoch": 0.61, "learning_rate": 6.950910072579935e-06, "loss": 1.3018, "step": 22361 }, { "epoch": 0.61, "learning_rate": 6.9500676962267985e-06, "loss": 1.3562, "step": 22362 }, { "epoch": 0.61, "learning_rate": 6.9492253437349066e-06, "loss": 1.1299, "step": 22363 }, { "epoch": 0.61, "learning_rate": 6.948383015110835e-06, "loss": 1.2427, "step": 22364 }, { "epoch": 0.61, "learning_rate": 6.947540710361181e-06, "loss": 1.3198, "step": 22365 }, { "epoch": 0.61, "learning_rate": 6.946698429492535e-06, "loss": 1.4092, "step": 22366 }, { "epoch": 0.61, "learning_rate": 6.945856172511485e-06, "loss": 1.1499, "step": 22367 }, { "epoch": 0.61, "learning_rate": 6.94501393942462e-06, "loss": 1.4392, "step": 22368 }, { "epoch": 0.61, "learning_rate": 6.944171730238527e-06, "loss": 1.2527, "step": 22369 }, { "epoch": 0.61, "learning_rate": 6.943329544959801e-06, "loss": 1.7061, "step": 22370 }, { "epoch": 0.61, "learning_rate": 6.942487383595023e-06, "loss": 1.135, "step": 22371 }, { "epoch": 0.61, "learning_rate": 6.94164524615079e-06, "loss": 1.1335, "step": 22372 }, { "epoch": 0.61, "learning_rate": 6.9408031326336844e-06, "loss": 1.2878, "step": 22373 }, { "epoch": 0.61, "learning_rate": 6.9399610430502975e-06, "loss": 1.0854, "step": 22374 }, { "epoch": 0.61, "learning_rate": 6.939118977407215e-06, "loss": 1.1843, "step": 22375 }, { "epoch": 0.61, "learning_rate": 6.938276935711028e-06, "loss": 1.3044, "step": 22376 }, { "epoch": 0.61, "learning_rate": 6.937434917968321e-06, "loss": 1.355, "step": 22377 }, { "epoch": 0.61, "learning_rate": 6.936592924185686e-06, "loss": 1.4165, "step": 22378 }, { "epoch": 0.61, "learning_rate": 6.935750954369703e-06, "loss": 1.3015, "step": 22379 }, { "epoch": 0.61, "learning_rate": 6.9349090085269645e-06, "loss": 1.302, "step": 22380 }, { "epoch": 0.61, "learning_rate": 6.93406708666406e-06, "loss": 1.2156, "step": 22381 }, { "epoch": 0.61, "learning_rate": 6.933225188787569e-06, "loss": 1.2351, "step": 22382 }, { "epoch": 0.61, "learning_rate": 6.932383314904085e-06, "loss": 1.416, "step": 22383 }, { "epoch": 0.61, "learning_rate": 6.93154146502019e-06, "loss": 1.186, "step": 22384 }, { "epoch": 0.61, "learning_rate": 6.930699639142473e-06, "loss": 1.248, "step": 22385 }, { "epoch": 0.61, "learning_rate": 6.929857837277516e-06, "loss": 1.688, "step": 22386 }, { "epoch": 0.61, "learning_rate": 6.929016059431911e-06, "loss": 1.1931, "step": 22387 }, { "epoch": 0.61, "learning_rate": 6.928174305612238e-06, "loss": 1.2441, "step": 22388 }, { "epoch": 0.61, "learning_rate": 6.927332575825086e-06, "loss": 1.3242, "step": 22389 }, { "epoch": 0.61, "learning_rate": 6.926490870077038e-06, "loss": 1.4158, "step": 22390 }, { "epoch": 0.61, "learning_rate": 6.925649188374681e-06, "loss": 1.3943, "step": 22391 }, { "epoch": 0.61, "learning_rate": 6.924807530724599e-06, "loss": 1.2822, "step": 22392 }, { "epoch": 0.61, "learning_rate": 6.923965897133378e-06, "loss": 1.1538, "step": 22393 }, { "epoch": 0.61, "learning_rate": 6.923124287607599e-06, "loss": 1.2625, "step": 22394 }, { "epoch": 0.61, "learning_rate": 6.9222827021538465e-06, "loss": 1.3433, "step": 22395 }, { "epoch": 0.61, "learning_rate": 6.921441140778713e-06, "loss": 1.3057, "step": 22396 }, { "epoch": 0.61, "learning_rate": 6.920599603488769e-06, "loss": 1.2798, "step": 22397 }, { "epoch": 0.61, "learning_rate": 6.919758090290613e-06, "loss": 1.157, "step": 22398 }, { "epoch": 0.61, "learning_rate": 6.918916601190817e-06, "loss": 1.2351, "step": 22399 }, { "epoch": 0.61, "learning_rate": 6.9180751361959716e-06, "loss": 1.3684, "step": 22400 }, { "epoch": 0.61, "learning_rate": 6.917233695312653e-06, "loss": 1.2854, "step": 22401 }, { "epoch": 0.61, "learning_rate": 6.916392278547455e-06, "loss": 1.1559, "step": 22402 }, { "epoch": 0.61, "learning_rate": 6.915550885906945e-06, "loss": 1.2446, "step": 22403 }, { "epoch": 0.61, "learning_rate": 6.914709517397724e-06, "loss": 1.3704, "step": 22404 }, { "epoch": 0.61, "learning_rate": 6.913868173026357e-06, "loss": 1.228, "step": 22405 }, { "epoch": 0.61, "learning_rate": 6.91302685279944e-06, "loss": 1.1733, "step": 22406 }, { "epoch": 0.61, "learning_rate": 6.912185556723543e-06, "loss": 1.2178, "step": 22407 }, { "epoch": 0.61, "learning_rate": 6.911344284805259e-06, "loss": 1.1761, "step": 22408 }, { "epoch": 0.61, "learning_rate": 6.910503037051164e-06, "loss": 1.6714, "step": 22409 }, { "epoch": 0.61, "learning_rate": 6.909661813467839e-06, "loss": 1.3049, "step": 22410 }, { "epoch": 0.61, "learning_rate": 6.908820614061868e-06, "loss": 1.2217, "step": 22411 }, { "epoch": 0.61, "learning_rate": 6.9079794388398305e-06, "loss": 1.4487, "step": 22412 }, { "epoch": 0.61, "learning_rate": 6.907138287808309e-06, "loss": 1.2244, "step": 22413 }, { "epoch": 0.61, "learning_rate": 6.906297160973883e-06, "loss": 1.4165, "step": 22414 }, { "epoch": 0.61, "learning_rate": 6.905456058343133e-06, "loss": 1.2141, "step": 22415 }, { "epoch": 0.61, "learning_rate": 6.904614979922638e-06, "loss": 1.2595, "step": 22416 }, { "epoch": 0.61, "learning_rate": 6.903773925718982e-06, "loss": 1.3657, "step": 22417 }, { "epoch": 0.61, "learning_rate": 6.902932895738741e-06, "loss": 1.1284, "step": 22418 }, { "epoch": 0.61, "learning_rate": 6.9020918899885e-06, "loss": 1.4082, "step": 22419 }, { "epoch": 0.61, "learning_rate": 6.901250908474833e-06, "loss": 1.3169, "step": 22420 }, { "epoch": 0.61, "learning_rate": 6.900409951204321e-06, "loss": 1.335, "step": 22421 }, { "epoch": 0.61, "learning_rate": 6.899569018183545e-06, "loss": 1.4131, "step": 22422 }, { "epoch": 0.61, "learning_rate": 6.898728109419084e-06, "loss": 1.3506, "step": 22423 }, { "epoch": 0.61, "learning_rate": 6.897887224917514e-06, "loss": 1.2361, "step": 22424 }, { "epoch": 0.61, "learning_rate": 6.897046364685417e-06, "loss": 1.2063, "step": 22425 }, { "epoch": 0.61, "learning_rate": 6.89620552872937e-06, "loss": 1.2573, "step": 22426 }, { "epoch": 0.61, "learning_rate": 6.895364717055949e-06, "loss": 1.2183, "step": 22427 }, { "epoch": 0.61, "learning_rate": 6.894523929671737e-06, "loss": 1.2488, "step": 22428 }, { "epoch": 0.61, "learning_rate": 6.893683166583309e-06, "loss": 1.2527, "step": 22429 }, { "epoch": 0.61, "learning_rate": 6.892842427797244e-06, "loss": 1.2585, "step": 22430 }, { "epoch": 0.61, "learning_rate": 6.8920017133201175e-06, "loss": 1.2219, "step": 22431 }, { "epoch": 0.61, "learning_rate": 6.89116102315851e-06, "loss": 1.1843, "step": 22432 }, { "epoch": 0.61, "learning_rate": 6.890320357318993e-06, "loss": 1.1968, "step": 22433 }, { "epoch": 0.61, "learning_rate": 6.889479715808152e-06, "loss": 1.2415, "step": 22434 }, { "epoch": 0.61, "learning_rate": 6.8886390986325555e-06, "loss": 1.4019, "step": 22435 }, { "epoch": 0.61, "learning_rate": 6.887798505798786e-06, "loss": 1.4294, "step": 22436 }, { "epoch": 0.61, "learning_rate": 6.886957937313415e-06, "loss": 1.3447, "step": 22437 }, { "epoch": 0.61, "learning_rate": 6.886117393183025e-06, "loss": 1.2166, "step": 22438 }, { "epoch": 0.61, "learning_rate": 6.885276873414184e-06, "loss": 1.3091, "step": 22439 }, { "epoch": 0.61, "learning_rate": 6.884436378013475e-06, "loss": 1.3005, "step": 22440 }, { "epoch": 0.61, "learning_rate": 6.883595906987467e-06, "loss": 1.3333, "step": 22441 }, { "epoch": 0.61, "learning_rate": 6.88275546034274e-06, "loss": 1.2434, "step": 22442 }, { "epoch": 0.61, "learning_rate": 6.881915038085874e-06, "loss": 1.2007, "step": 22443 }, { "epoch": 0.61, "learning_rate": 6.881074640223433e-06, "loss": 1.4021, "step": 22444 }, { "epoch": 0.61, "learning_rate": 6.880234266762e-06, "loss": 1.0817, "step": 22445 }, { "epoch": 0.61, "learning_rate": 6.879393917708146e-06, "loss": 1.1858, "step": 22446 }, { "epoch": 0.61, "learning_rate": 6.878553593068448e-06, "loss": 1.3271, "step": 22447 }, { "epoch": 0.61, "learning_rate": 6.877713292849476e-06, "loss": 1.2458, "step": 22448 }, { "epoch": 0.61, "learning_rate": 6.87687301705781e-06, "loss": 1.2371, "step": 22449 }, { "epoch": 0.61, "learning_rate": 6.8760327657000194e-06, "loss": 1.1858, "step": 22450 }, { "epoch": 0.61, "learning_rate": 6.87519253878268e-06, "loss": 1.2275, "step": 22451 }, { "epoch": 0.61, "learning_rate": 6.874352336312364e-06, "loss": 1.2214, "step": 22452 }, { "epoch": 0.61, "learning_rate": 6.873512158295647e-06, "loss": 1.2805, "step": 22453 }, { "epoch": 0.61, "learning_rate": 6.8726720047391e-06, "loss": 1.1807, "step": 22454 }, { "epoch": 0.61, "learning_rate": 6.871831875649297e-06, "loss": 1.2021, "step": 22455 }, { "epoch": 0.61, "learning_rate": 6.870991771032809e-06, "loss": 1.2207, "step": 22456 }, { "epoch": 0.61, "learning_rate": 6.87015169089621e-06, "loss": 1.4045, "step": 22457 }, { "epoch": 0.61, "learning_rate": 6.8693116352460745e-06, "loss": 1.1895, "step": 22458 }, { "epoch": 0.61, "learning_rate": 6.868471604088971e-06, "loss": 1.2556, "step": 22459 }, { "epoch": 0.61, "learning_rate": 6.867631597431475e-06, "loss": 1.2253, "step": 22460 }, { "epoch": 0.61, "learning_rate": 6.8667916152801526e-06, "loss": 1.2134, "step": 22461 }, { "epoch": 0.61, "learning_rate": 6.865951657641583e-06, "loss": 1.2065, "step": 22462 }, { "epoch": 0.61, "learning_rate": 6.865111724522332e-06, "loss": 1.3735, "step": 22463 }, { "epoch": 0.61, "learning_rate": 6.864271815928974e-06, "loss": 1.2839, "step": 22464 }, { "epoch": 0.61, "learning_rate": 6.863431931868078e-06, "loss": 1.2341, "step": 22465 }, { "epoch": 0.61, "learning_rate": 6.862592072346217e-06, "loss": 1.2231, "step": 22466 }, { "epoch": 0.61, "learning_rate": 6.861752237369957e-06, "loss": 1.3757, "step": 22467 }, { "epoch": 0.61, "learning_rate": 6.860912426945876e-06, "loss": 1.1106, "step": 22468 }, { "epoch": 0.61, "learning_rate": 6.860072641080537e-06, "loss": 1.249, "step": 22469 }, { "epoch": 0.61, "learning_rate": 6.859232879780515e-06, "loss": 1.3027, "step": 22470 }, { "epoch": 0.61, "learning_rate": 6.858393143052375e-06, "loss": 1.2104, "step": 22471 }, { "epoch": 0.61, "learning_rate": 6.8575534309026915e-06, "loss": 1.3516, "step": 22472 }, { "epoch": 0.61, "learning_rate": 6.856713743338033e-06, "loss": 1.3164, "step": 22473 }, { "epoch": 0.61, "learning_rate": 6.855874080364966e-06, "loss": 1.3335, "step": 22474 }, { "epoch": 0.61, "learning_rate": 6.855034441990066e-06, "loss": 1.0038, "step": 22475 }, { "epoch": 0.61, "learning_rate": 6.854194828219892e-06, "loss": 1.3066, "step": 22476 }, { "epoch": 0.61, "learning_rate": 6.853355239061026e-06, "loss": 1.335, "step": 22477 }, { "epoch": 0.61, "learning_rate": 6.8525156745200206e-06, "loss": 1.4106, "step": 22478 }, { "epoch": 0.61, "learning_rate": 6.85167613460346e-06, "loss": 1.3198, "step": 22479 }, { "epoch": 0.61, "learning_rate": 6.850836619317898e-06, "loss": 1.1814, "step": 22480 }, { "epoch": 0.61, "learning_rate": 6.849997128669916e-06, "loss": 1.3726, "step": 22481 }, { "epoch": 0.61, "learning_rate": 6.849157662666068e-06, "loss": 1.3242, "step": 22482 }, { "epoch": 0.61, "learning_rate": 6.848318221312937e-06, "loss": 1.3228, "step": 22483 }, { "epoch": 0.61, "learning_rate": 6.8474788046170735e-06, "loss": 1.3423, "step": 22484 }, { "epoch": 0.61, "learning_rate": 6.846639412585062e-06, "loss": 1.3367, "step": 22485 }, { "epoch": 0.61, "learning_rate": 6.845800045223454e-06, "loss": 1.3298, "step": 22486 }, { "epoch": 0.61, "learning_rate": 6.8449607025388295e-06, "loss": 1.2732, "step": 22487 }, { "epoch": 0.61, "learning_rate": 6.844121384537742e-06, "loss": 1.3765, "step": 22488 }, { "epoch": 0.61, "learning_rate": 6.843282091226767e-06, "loss": 1.2214, "step": 22489 }, { "epoch": 0.61, "learning_rate": 6.842442822612471e-06, "loss": 1.3364, "step": 22490 }, { "epoch": 0.61, "learning_rate": 6.841603578701416e-06, "loss": 1.2493, "step": 22491 }, { "epoch": 0.61, "learning_rate": 6.84076435950017e-06, "loss": 1.2188, "step": 22492 }, { "epoch": 0.61, "learning_rate": 6.8399251650152975e-06, "loss": 1.1643, "step": 22493 }, { "epoch": 0.61, "learning_rate": 6.839085995253365e-06, "loss": 1.3066, "step": 22494 }, { "epoch": 0.61, "learning_rate": 6.838246850220938e-06, "loss": 1.3655, "step": 22495 }, { "epoch": 0.61, "learning_rate": 6.83740772992458e-06, "loss": 1.1948, "step": 22496 }, { "epoch": 0.61, "learning_rate": 6.836568634370856e-06, "loss": 1.3003, "step": 22497 }, { "epoch": 0.61, "learning_rate": 6.835729563566333e-06, "loss": 1.3123, "step": 22498 }, { "epoch": 0.61, "learning_rate": 6.834890517517572e-06, "loss": 1.1177, "step": 22499 }, { "epoch": 0.61, "learning_rate": 6.834051496231142e-06, "loss": 1.2891, "step": 22500 }, { "epoch": 0.61, "learning_rate": 6.833212499713602e-06, "loss": 1.3042, "step": 22501 }, { "epoch": 0.61, "learning_rate": 6.832373527971521e-06, "loss": 1.1831, "step": 22502 }, { "epoch": 0.61, "learning_rate": 6.831534581011457e-06, "loss": 1.2512, "step": 22503 }, { "epoch": 0.61, "learning_rate": 6.830695658839976e-06, "loss": 1.3704, "step": 22504 }, { "epoch": 0.61, "learning_rate": 6.8298567614636444e-06, "loss": 1.2239, "step": 22505 }, { "epoch": 0.61, "learning_rate": 6.82901788888902e-06, "loss": 1.3818, "step": 22506 }, { "epoch": 0.61, "learning_rate": 6.828179041122672e-06, "loss": 1.2207, "step": 22507 }, { "epoch": 0.61, "learning_rate": 6.827340218171156e-06, "loss": 1.4236, "step": 22508 }, { "epoch": 0.61, "learning_rate": 6.826501420041043e-06, "loss": 1.3899, "step": 22509 }, { "epoch": 0.61, "learning_rate": 6.825662646738886e-06, "loss": 1.2749, "step": 22510 }, { "epoch": 0.61, "learning_rate": 6.824823898271256e-06, "loss": 1.3374, "step": 22511 }, { "epoch": 0.61, "learning_rate": 6.823985174644707e-06, "loss": 1.2305, "step": 22512 }, { "epoch": 0.61, "learning_rate": 6.8231464758658075e-06, "loss": 1.2751, "step": 22513 }, { "epoch": 0.61, "learning_rate": 6.822307801941113e-06, "loss": 1.812, "step": 22514 }, { "epoch": 0.61, "learning_rate": 6.821469152877191e-06, "loss": 1.1824, "step": 22515 }, { "epoch": 0.61, "learning_rate": 6.820630528680597e-06, "loss": 1.3469, "step": 22516 }, { "epoch": 0.61, "learning_rate": 6.819791929357897e-06, "loss": 1.1499, "step": 22517 }, { "epoch": 0.61, "learning_rate": 6.818953354915647e-06, "loss": 1.2935, "step": 22518 }, { "epoch": 0.61, "learning_rate": 6.818114805360409e-06, "loss": 1.3589, "step": 22519 }, { "epoch": 0.62, "learning_rate": 6.81727628069875e-06, "loss": 1.1807, "step": 22520 }, { "epoch": 0.62, "learning_rate": 6.81643778093722e-06, "loss": 1.2722, "step": 22521 }, { "epoch": 0.62, "learning_rate": 6.815599306082389e-06, "loss": 1.3359, "step": 22522 }, { "epoch": 0.62, "learning_rate": 6.8147608561408055e-06, "loss": 1.3438, "step": 22523 }, { "epoch": 0.62, "learning_rate": 6.81392243111904e-06, "loss": 1.1892, "step": 22524 }, { "epoch": 0.62, "learning_rate": 6.813084031023643e-06, "loss": 1.1958, "step": 22525 }, { "epoch": 0.62, "learning_rate": 6.8122456558611825e-06, "loss": 1.1831, "step": 22526 }, { "epoch": 0.62, "learning_rate": 6.811407305638209e-06, "loss": 1.1792, "step": 22527 }, { "epoch": 0.62, "learning_rate": 6.810568980361289e-06, "loss": 1.4143, "step": 22528 }, { "epoch": 0.62, "learning_rate": 6.8097306800369735e-06, "loss": 1.3389, "step": 22529 }, { "epoch": 0.62, "learning_rate": 6.808892404671829e-06, "loss": 1.2551, "step": 22530 }, { "epoch": 0.62, "learning_rate": 6.808054154272405e-06, "loss": 1.2341, "step": 22531 }, { "epoch": 0.62, "learning_rate": 6.807215928845271e-06, "loss": 1.3008, "step": 22532 }, { "epoch": 0.62, "learning_rate": 6.806377728396972e-06, "loss": 1.1841, "step": 22533 }, { "epoch": 0.62, "learning_rate": 6.805539552934073e-06, "loss": 1.2026, "step": 22534 }, { "epoch": 0.62, "learning_rate": 6.804701402463132e-06, "loss": 1.3215, "step": 22535 }, { "epoch": 0.62, "learning_rate": 6.8038632769907045e-06, "loss": 1.2615, "step": 22536 }, { "epoch": 0.62, "learning_rate": 6.8030251765233475e-06, "loss": 1.3247, "step": 22537 }, { "epoch": 0.62, "learning_rate": 6.802187101067619e-06, "loss": 1.0385, "step": 22538 }, { "epoch": 0.62, "learning_rate": 6.801349050630075e-06, "loss": 1.1185, "step": 22539 }, { "epoch": 0.62, "learning_rate": 6.80051102521727e-06, "loss": 1.304, "step": 22540 }, { "epoch": 0.62, "learning_rate": 6.799673024835765e-06, "loss": 1.2136, "step": 22541 }, { "epoch": 0.62, "learning_rate": 6.79883504949211e-06, "loss": 1.0933, "step": 22542 }, { "epoch": 0.62, "learning_rate": 6.797997099192868e-06, "loss": 1.2549, "step": 22543 }, { "epoch": 0.62, "learning_rate": 6.797159173944587e-06, "loss": 1.1982, "step": 22544 }, { "epoch": 0.62, "learning_rate": 6.79632127375383e-06, "loss": 1.292, "step": 22545 }, { "epoch": 0.62, "learning_rate": 6.795483398627147e-06, "loss": 1.4114, "step": 22546 }, { "epoch": 0.62, "learning_rate": 6.794645548571097e-06, "loss": 1.0453, "step": 22547 }, { "epoch": 0.62, "learning_rate": 6.79380772359223e-06, "loss": 1.3916, "step": 22548 }, { "epoch": 0.62, "learning_rate": 6.792969923697106e-06, "loss": 1.2747, "step": 22549 }, { "epoch": 0.62, "learning_rate": 6.792132148892276e-06, "loss": 1.3818, "step": 22550 }, { "epoch": 0.62, "learning_rate": 6.791294399184295e-06, "loss": 1.2305, "step": 22551 }, { "epoch": 0.62, "learning_rate": 6.790456674579719e-06, "loss": 1.311, "step": 22552 }, { "epoch": 0.62, "learning_rate": 6.789618975085101e-06, "loss": 1.3462, "step": 22553 }, { "epoch": 0.62, "learning_rate": 6.788781300706994e-06, "loss": 1.2234, "step": 22554 }, { "epoch": 0.62, "learning_rate": 6.787943651451951e-06, "loss": 1.2661, "step": 22555 }, { "epoch": 0.62, "learning_rate": 6.78710602732653e-06, "loss": 1.2959, "step": 22556 }, { "epoch": 0.62, "learning_rate": 6.7862684283372775e-06, "loss": 1.5017, "step": 22557 }, { "epoch": 0.62, "learning_rate": 6.785430854490751e-06, "loss": 1.332, "step": 22558 }, { "epoch": 0.62, "learning_rate": 6.784593305793501e-06, "loss": 1.4294, "step": 22559 }, { "epoch": 0.62, "learning_rate": 6.783755782252081e-06, "loss": 1.3179, "step": 22560 }, { "epoch": 0.62, "learning_rate": 6.782918283873043e-06, "loss": 1.688, "step": 22561 }, { "epoch": 0.62, "learning_rate": 6.7820808106629425e-06, "loss": 1.3662, "step": 22562 }, { "epoch": 0.62, "learning_rate": 6.781243362628325e-06, "loss": 1.2141, "step": 22563 }, { "epoch": 0.62, "learning_rate": 6.7804059397757475e-06, "loss": 1.1567, "step": 22564 }, { "epoch": 0.62, "learning_rate": 6.779568542111758e-06, "loss": 1.1204, "step": 22565 }, { "epoch": 0.62, "learning_rate": 6.778731169642909e-06, "loss": 1.2456, "step": 22566 }, { "epoch": 0.62, "learning_rate": 6.777893822375759e-06, "loss": 1.3279, "step": 22567 }, { "epoch": 0.62, "learning_rate": 6.7770565003168454e-06, "loss": 1.1941, "step": 22568 }, { "epoch": 0.62, "learning_rate": 6.776219203472732e-06, "loss": 1.1592, "step": 22569 }, { "epoch": 0.62, "learning_rate": 6.775381931849958e-06, "loss": 1.2615, "step": 22570 }, { "epoch": 0.62, "learning_rate": 6.7745446854550865e-06, "loss": 1.2749, "step": 22571 }, { "epoch": 0.62, "learning_rate": 6.773707464294654e-06, "loss": 1.3708, "step": 22572 }, { "epoch": 0.62, "learning_rate": 6.772870268375222e-06, "loss": 1.2986, "step": 22573 }, { "epoch": 0.62, "learning_rate": 6.772033097703331e-06, "loss": 1.3091, "step": 22574 }, { "epoch": 0.62, "learning_rate": 6.771195952285541e-06, "loss": 1.3652, "step": 22575 }, { "epoch": 0.62, "learning_rate": 6.77035883212839e-06, "loss": 1.3545, "step": 22576 }, { "epoch": 0.62, "learning_rate": 6.769521737238437e-06, "loss": 1.2617, "step": 22577 }, { "epoch": 0.62, "learning_rate": 6.7686846676222216e-06, "loss": 1.4004, "step": 22578 }, { "epoch": 0.62, "learning_rate": 6.767847623286304e-06, "loss": 1.3457, "step": 22579 }, { "epoch": 0.62, "learning_rate": 6.7670106042372206e-06, "loss": 1.3474, "step": 22580 }, { "epoch": 0.62, "learning_rate": 6.766173610481529e-06, "loss": 1.2356, "step": 22581 }, { "epoch": 0.62, "learning_rate": 6.765336642025776e-06, "loss": 1.2327, "step": 22582 }, { "epoch": 0.62, "learning_rate": 6.764499698876505e-06, "loss": 1.1055, "step": 22583 }, { "epoch": 0.62, "learning_rate": 6.76366278104027e-06, "loss": 1.3438, "step": 22584 }, { "epoch": 0.62, "learning_rate": 6.762825888523614e-06, "loss": 1.2866, "step": 22585 }, { "epoch": 0.62, "learning_rate": 6.761989021333086e-06, "loss": 1.2979, "step": 22586 }, { "epoch": 0.62, "learning_rate": 6.761152179475233e-06, "loss": 1.0842, "step": 22587 }, { "epoch": 0.62, "learning_rate": 6.760315362956604e-06, "loss": 1.2705, "step": 22588 }, { "epoch": 0.62, "learning_rate": 6.7594785717837415e-06, "loss": 1.1833, "step": 22589 }, { "epoch": 0.62, "learning_rate": 6.7586418059631975e-06, "loss": 1.3735, "step": 22590 }, { "epoch": 0.62, "learning_rate": 6.757805065501515e-06, "loss": 1.2798, "step": 22591 }, { "epoch": 0.62, "learning_rate": 6.756968350405242e-06, "loss": 1.167, "step": 22592 }, { "epoch": 0.62, "learning_rate": 6.75613166068092e-06, "loss": 1.3511, "step": 22593 }, { "epoch": 0.62, "learning_rate": 6.755294996335102e-06, "loss": 1.3083, "step": 22594 }, { "epoch": 0.62, "learning_rate": 6.754458357374329e-06, "loss": 1.325, "step": 22595 }, { "epoch": 0.62, "learning_rate": 6.753621743805147e-06, "loss": 1.647, "step": 22596 }, { "epoch": 0.62, "learning_rate": 6.752785155634103e-06, "loss": 1.3032, "step": 22597 }, { "epoch": 0.62, "learning_rate": 6.751948592867741e-06, "loss": 1.2252, "step": 22598 }, { "epoch": 0.62, "learning_rate": 6.7511120555126055e-06, "loss": 1.1536, "step": 22599 }, { "epoch": 0.62, "learning_rate": 6.750275543575241e-06, "loss": 1.1267, "step": 22600 }, { "epoch": 0.62, "learning_rate": 6.749439057062195e-06, "loss": 1.2151, "step": 22601 }, { "epoch": 0.62, "learning_rate": 6.748602595980005e-06, "loss": 1.0852, "step": 22602 }, { "epoch": 0.62, "learning_rate": 6.747766160335223e-06, "loss": 1.2927, "step": 22603 }, { "epoch": 0.62, "learning_rate": 6.746929750134388e-06, "loss": 1.3328, "step": 22604 }, { "epoch": 0.62, "learning_rate": 6.746093365384046e-06, "loss": 1.0613, "step": 22605 }, { "epoch": 0.62, "learning_rate": 6.745257006090737e-06, "loss": 1.408, "step": 22606 }, { "epoch": 0.62, "learning_rate": 6.74442067226101e-06, "loss": 1.1504, "step": 22607 }, { "epoch": 0.62, "learning_rate": 6.743584363901401e-06, "loss": 1.3904, "step": 22608 }, { "epoch": 0.62, "learning_rate": 6.7427480810184595e-06, "loss": 1.2812, "step": 22609 }, { "epoch": 0.62, "learning_rate": 6.741911823618723e-06, "loss": 1.2771, "step": 22610 }, { "epoch": 0.62, "learning_rate": 6.7410755917087385e-06, "loss": 1.4116, "step": 22611 }, { "epoch": 0.62, "learning_rate": 6.740239385295044e-06, "loss": 1.3574, "step": 22612 }, { "epoch": 0.62, "learning_rate": 6.739403204384183e-06, "loss": 1.2449, "step": 22613 }, { "epoch": 0.62, "learning_rate": 6.738567048982702e-06, "loss": 1.4324, "step": 22614 }, { "epoch": 0.62, "learning_rate": 6.737730919097135e-06, "loss": 1.3354, "step": 22615 }, { "epoch": 0.62, "learning_rate": 6.736894814734032e-06, "loss": 1.281, "step": 22616 }, { "epoch": 0.62, "learning_rate": 6.736058735899924e-06, "loss": 1.3999, "step": 22617 }, { "epoch": 0.62, "learning_rate": 6.735222682601363e-06, "loss": 1.3223, "step": 22618 }, { "epoch": 0.62, "learning_rate": 6.73438665484488e-06, "loss": 1.2002, "step": 22619 }, { "epoch": 0.62, "learning_rate": 6.733550652637024e-06, "loss": 1.3376, "step": 22620 }, { "epoch": 0.62, "learning_rate": 6.732714675984327e-06, "loss": 1.2507, "step": 22621 }, { "epoch": 0.62, "learning_rate": 6.7318787248933404e-06, "loss": 1.2571, "step": 22622 }, { "epoch": 0.62, "learning_rate": 6.731042799370591e-06, "loss": 1.228, "step": 22623 }, { "epoch": 0.62, "learning_rate": 6.730206899422632e-06, "loss": 1.1877, "step": 22624 }, { "epoch": 0.62, "learning_rate": 6.729371025055991e-06, "loss": 1.4058, "step": 22625 }, { "epoch": 0.62, "learning_rate": 6.7285351762772175e-06, "loss": 1.2986, "step": 22626 }, { "epoch": 0.62, "learning_rate": 6.727699353092842e-06, "loss": 1.2041, "step": 22627 }, { "epoch": 0.62, "learning_rate": 6.72686355550941e-06, "loss": 1.1716, "step": 22628 }, { "epoch": 0.62, "learning_rate": 6.72602778353346e-06, "loss": 1.2607, "step": 22629 }, { "epoch": 0.62, "learning_rate": 6.725192037171526e-06, "loss": 1.2961, "step": 22630 }, { "epoch": 0.62, "learning_rate": 6.724356316430154e-06, "loss": 1.4587, "step": 22631 }, { "epoch": 0.62, "learning_rate": 6.723520621315873e-06, "loss": 1.1978, "step": 22632 }, { "epoch": 0.62, "learning_rate": 6.72268495183523e-06, "loss": 1.2827, "step": 22633 }, { "epoch": 0.62, "learning_rate": 6.721849307994756e-06, "loss": 1.2229, "step": 22634 }, { "epoch": 0.62, "learning_rate": 6.721013689800995e-06, "loss": 1.2356, "step": 22635 }, { "epoch": 0.62, "learning_rate": 6.720178097260477e-06, "loss": 1.304, "step": 22636 }, { "epoch": 0.62, "learning_rate": 6.719342530379747e-06, "loss": 1.3186, "step": 22637 }, { "epoch": 0.62, "learning_rate": 6.718506989165336e-06, "loss": 1.2722, "step": 22638 }, { "epoch": 0.62, "learning_rate": 6.717671473623783e-06, "loss": 1.2612, "step": 22639 }, { "epoch": 0.62, "learning_rate": 6.7168359837616245e-06, "loss": 1.3572, "step": 22640 }, { "epoch": 0.62, "learning_rate": 6.7160005195854e-06, "loss": 1.1807, "step": 22641 }, { "epoch": 0.62, "learning_rate": 6.715165081101643e-06, "loss": 1.2209, "step": 22642 }, { "epoch": 0.62, "learning_rate": 6.714329668316886e-06, "loss": 1.2344, "step": 22643 }, { "epoch": 0.62, "learning_rate": 6.7134942812376724e-06, "loss": 1.0833, "step": 22644 }, { "epoch": 0.62, "learning_rate": 6.712658919870532e-06, "loss": 1.2366, "step": 22645 }, { "epoch": 0.62, "learning_rate": 6.711823584222004e-06, "loss": 1.2805, "step": 22646 }, { "epoch": 0.62, "learning_rate": 6.71098827429862e-06, "loss": 1.2698, "step": 22647 }, { "epoch": 0.62, "learning_rate": 6.71015299010692e-06, "loss": 1.6763, "step": 22648 }, { "epoch": 0.62, "learning_rate": 6.709317731653433e-06, "loss": 1.1674, "step": 22649 }, { "epoch": 0.62, "learning_rate": 6.708482498944699e-06, "loss": 1.7261, "step": 22650 }, { "epoch": 0.62, "learning_rate": 6.70764729198725e-06, "loss": 1.4106, "step": 22651 }, { "epoch": 0.62, "learning_rate": 6.7068121107876195e-06, "loss": 1.3247, "step": 22652 }, { "epoch": 0.62, "learning_rate": 6.705976955352342e-06, "loss": 1.2754, "step": 22653 }, { "epoch": 0.62, "learning_rate": 6.705141825687953e-06, "loss": 1.1882, "step": 22654 }, { "epoch": 0.62, "learning_rate": 6.704306721800984e-06, "loss": 1.4453, "step": 22655 }, { "epoch": 0.62, "learning_rate": 6.703471643697972e-06, "loss": 1.3369, "step": 22656 }, { "epoch": 0.62, "learning_rate": 6.702636591385444e-06, "loss": 1.2612, "step": 22657 }, { "epoch": 0.62, "learning_rate": 6.701801564869935e-06, "loss": 1.4443, "step": 22658 }, { "epoch": 0.62, "learning_rate": 6.700966564157987e-06, "loss": 1.4241, "step": 22659 }, { "epoch": 0.62, "learning_rate": 6.700131589256118e-06, "loss": 1.3962, "step": 22660 }, { "epoch": 0.62, "learning_rate": 6.6992966401708746e-06, "loss": 1.2661, "step": 22661 }, { "epoch": 0.62, "learning_rate": 6.698461716908775e-06, "loss": 1.3333, "step": 22662 }, { "epoch": 0.62, "learning_rate": 6.697626819476366e-06, "loss": 1.2241, "step": 22663 }, { "epoch": 0.62, "learning_rate": 6.696791947880166e-06, "loss": 1.4604, "step": 22664 }, { "epoch": 0.62, "learning_rate": 6.6959571021267165e-06, "loss": 1.0613, "step": 22665 }, { "epoch": 0.62, "learning_rate": 6.695122282222541e-06, "loss": 1.4019, "step": 22666 }, { "epoch": 0.62, "learning_rate": 6.6942874881741796e-06, "loss": 1.3057, "step": 22667 }, { "epoch": 0.62, "learning_rate": 6.693452719988152e-06, "loss": 1.292, "step": 22668 }, { "epoch": 0.62, "learning_rate": 6.692617977671003e-06, "loss": 1.2439, "step": 22669 }, { "epoch": 0.62, "learning_rate": 6.691783261229248e-06, "loss": 1.332, "step": 22670 }, { "epoch": 0.62, "learning_rate": 6.69094857066943e-06, "loss": 1.2668, "step": 22671 }, { "epoch": 0.62, "learning_rate": 6.690113905998072e-06, "loss": 1.1775, "step": 22672 }, { "epoch": 0.62, "learning_rate": 6.689279267221709e-06, "loss": 1.3379, "step": 22673 }, { "epoch": 0.62, "learning_rate": 6.6884446543468665e-06, "loss": 1.2388, "step": 22674 }, { "epoch": 0.62, "learning_rate": 6.687610067380075e-06, "loss": 1.3313, "step": 22675 }, { "epoch": 0.62, "learning_rate": 6.686775506327867e-06, "loss": 1.1328, "step": 22676 }, { "epoch": 0.62, "learning_rate": 6.685940971196767e-06, "loss": 1.3081, "step": 22677 }, { "epoch": 0.62, "learning_rate": 6.685106461993309e-06, "loss": 1.3696, "step": 22678 }, { "epoch": 0.62, "learning_rate": 6.684271978724017e-06, "loss": 1.2866, "step": 22679 }, { "epoch": 0.62, "learning_rate": 6.683437521395424e-06, "loss": 1.304, "step": 22680 }, { "epoch": 0.62, "learning_rate": 6.682603090014055e-06, "loss": 1.3257, "step": 22681 }, { "epoch": 0.62, "learning_rate": 6.68176868458644e-06, "loss": 1.3516, "step": 22682 }, { "epoch": 0.62, "learning_rate": 6.680934305119106e-06, "loss": 1.2512, "step": 22683 }, { "epoch": 0.62, "learning_rate": 6.6800999516185815e-06, "loss": 1.3369, "step": 22684 }, { "epoch": 0.62, "learning_rate": 6.6792656240913936e-06, "loss": 1.6543, "step": 22685 }, { "epoch": 0.62, "learning_rate": 6.67843132254407e-06, "loss": 1.2673, "step": 22686 }, { "epoch": 0.62, "learning_rate": 6.6775970469831375e-06, "loss": 1.3865, "step": 22687 }, { "epoch": 0.62, "learning_rate": 6.676762797415125e-06, "loss": 1.165, "step": 22688 }, { "epoch": 0.62, "learning_rate": 6.675928573846555e-06, "loss": 1.2019, "step": 22689 }, { "epoch": 0.62, "learning_rate": 6.675094376283958e-06, "loss": 1.2927, "step": 22690 }, { "epoch": 0.62, "learning_rate": 6.67426020473386e-06, "loss": 1.3386, "step": 22691 }, { "epoch": 0.62, "learning_rate": 6.673426059202786e-06, "loss": 1.3318, "step": 22692 }, { "epoch": 0.62, "learning_rate": 6.672591939697261e-06, "loss": 1.4409, "step": 22693 }, { "epoch": 0.62, "learning_rate": 6.671757846223813e-06, "loss": 1.0779, "step": 22694 }, { "epoch": 0.62, "learning_rate": 6.6709237787889684e-06, "loss": 1.2429, "step": 22695 }, { "epoch": 0.62, "learning_rate": 6.6700897373992475e-06, "loss": 1.1614, "step": 22696 }, { "epoch": 0.62, "learning_rate": 6.669255722061181e-06, "loss": 1.3394, "step": 22697 }, { "epoch": 0.62, "learning_rate": 6.66842173278129e-06, "loss": 1.6436, "step": 22698 }, { "epoch": 0.62, "learning_rate": 6.667587769566102e-06, "loss": 1.2825, "step": 22699 }, { "epoch": 0.62, "learning_rate": 6.666753832422138e-06, "loss": 1.1951, "step": 22700 }, { "epoch": 0.62, "learning_rate": 6.665919921355928e-06, "loss": 1.3555, "step": 22701 }, { "epoch": 0.62, "learning_rate": 6.665086036373989e-06, "loss": 1.2212, "step": 22702 }, { "epoch": 0.62, "learning_rate": 6.6642521774828515e-06, "loss": 1.2949, "step": 22703 }, { "epoch": 0.62, "learning_rate": 6.663418344689032e-06, "loss": 1.2925, "step": 22704 }, { "epoch": 0.62, "learning_rate": 6.6625845379990615e-06, "loss": 1.3137, "step": 22705 }, { "epoch": 0.62, "learning_rate": 6.661750757419462e-06, "loss": 1.158, "step": 22706 }, { "epoch": 0.62, "learning_rate": 6.660917002956753e-06, "loss": 1.325, "step": 22707 }, { "epoch": 0.62, "learning_rate": 6.660083274617459e-06, "loss": 1.1711, "step": 22708 }, { "epoch": 0.62, "learning_rate": 6.659249572408103e-06, "loss": 1.6772, "step": 22709 }, { "epoch": 0.62, "learning_rate": 6.658415896335209e-06, "loss": 1.1755, "step": 22710 }, { "epoch": 0.62, "learning_rate": 6.6575822464052966e-06, "loss": 1.2937, "step": 22711 }, { "epoch": 0.62, "learning_rate": 6.656748622624889e-06, "loss": 1.1353, "step": 22712 }, { "epoch": 0.62, "learning_rate": 6.655915025000508e-06, "loss": 1.3267, "step": 22713 }, { "epoch": 0.62, "learning_rate": 6.655081453538675e-06, "loss": 1.2542, "step": 22714 }, { "epoch": 0.62, "learning_rate": 6.654247908245912e-06, "loss": 1.2551, "step": 22715 }, { "epoch": 0.62, "learning_rate": 6.653414389128741e-06, "loss": 1.2668, "step": 22716 }, { "epoch": 0.62, "learning_rate": 6.6525808961936815e-06, "loss": 1.2498, "step": 22717 }, { "epoch": 0.62, "learning_rate": 6.651747429447255e-06, "loss": 1.3564, "step": 22718 }, { "epoch": 0.62, "learning_rate": 6.650913988895982e-06, "loss": 1.4219, "step": 22719 }, { "epoch": 0.62, "learning_rate": 6.650080574546384e-06, "loss": 1.3281, "step": 22720 }, { "epoch": 0.62, "learning_rate": 6.649247186404979e-06, "loss": 1.2595, "step": 22721 }, { "epoch": 0.62, "learning_rate": 6.648413824478287e-06, "loss": 1.2056, "step": 22722 }, { "epoch": 0.62, "learning_rate": 6.647580488772832e-06, "loss": 1.2898, "step": 22723 }, { "epoch": 0.62, "learning_rate": 6.6467471792951295e-06, "loss": 1.3372, "step": 22724 }, { "epoch": 0.62, "learning_rate": 6.645913896051701e-06, "loss": 1.5015, "step": 22725 }, { "epoch": 0.62, "learning_rate": 6.645080639049064e-06, "loss": 1.2522, "step": 22726 }, { "epoch": 0.62, "learning_rate": 6.64424740829374e-06, "loss": 1.1482, "step": 22727 }, { "epoch": 0.62, "learning_rate": 6.643414203792244e-06, "loss": 1.2615, "step": 22728 }, { "epoch": 0.62, "learning_rate": 6.642581025551101e-06, "loss": 1.248, "step": 22729 }, { "epoch": 0.62, "learning_rate": 6.641747873576822e-06, "loss": 1.1309, "step": 22730 }, { "epoch": 0.62, "learning_rate": 6.640914747875929e-06, "loss": 1.1392, "step": 22731 }, { "epoch": 0.62, "learning_rate": 6.640081648454939e-06, "loss": 1.2344, "step": 22732 }, { "epoch": 0.62, "learning_rate": 6.639248575320372e-06, "loss": 1.3086, "step": 22733 }, { "epoch": 0.62, "learning_rate": 6.638415528478741e-06, "loss": 1.3447, "step": 22734 }, { "epoch": 0.62, "learning_rate": 6.637582507936569e-06, "loss": 1.353, "step": 22735 }, { "epoch": 0.62, "learning_rate": 6.636749513700369e-06, "loss": 1.272, "step": 22736 }, { "epoch": 0.62, "learning_rate": 6.635916545776656e-06, "loss": 1.2317, "step": 22737 }, { "epoch": 0.62, "learning_rate": 6.635083604171957e-06, "loss": 1.0999, "step": 22738 }, { "epoch": 0.62, "learning_rate": 6.634250688892775e-06, "loss": 1.3369, "step": 22739 }, { "epoch": 0.62, "learning_rate": 6.633417799945638e-06, "loss": 1.2612, "step": 22740 }, { "epoch": 0.62, "learning_rate": 6.632584937337054e-06, "loss": 1.2993, "step": 22741 }, { "epoch": 0.62, "learning_rate": 6.631752101073545e-06, "loss": 1.291, "step": 22742 }, { "epoch": 0.62, "learning_rate": 6.630919291161619e-06, "loss": 1.1479, "step": 22743 }, { "epoch": 0.62, "learning_rate": 6.630086507607803e-06, "loss": 1.2136, "step": 22744 }, { "epoch": 0.62, "learning_rate": 6.629253750418597e-06, "loss": 1.2551, "step": 22745 }, { "epoch": 0.62, "learning_rate": 6.628421019600533e-06, "loss": 1.2783, "step": 22746 }, { "epoch": 0.62, "learning_rate": 6.6275883151601095e-06, "loss": 1.2666, "step": 22747 }, { "epoch": 0.62, "learning_rate": 6.626755637103857e-06, "loss": 1.2314, "step": 22748 }, { "epoch": 0.62, "learning_rate": 6.625922985438275e-06, "loss": 1.3486, "step": 22749 }, { "epoch": 0.62, "learning_rate": 6.625090360169892e-06, "loss": 1.257, "step": 22750 }, { "epoch": 0.62, "learning_rate": 6.624257761305209e-06, "loss": 1.4746, "step": 22751 }, { "epoch": 0.62, "learning_rate": 6.6234251888507475e-06, "loss": 1.2434, "step": 22752 }, { "epoch": 0.62, "learning_rate": 6.622592642813021e-06, "loss": 1.3, "step": 22753 }, { "epoch": 0.62, "learning_rate": 6.62176012319854e-06, "loss": 1.3613, "step": 22754 }, { "epoch": 0.62, "learning_rate": 6.62092763001382e-06, "loss": 1.3877, "step": 22755 }, { "epoch": 0.62, "learning_rate": 6.6200951632653744e-06, "loss": 1.3801, "step": 22756 }, { "epoch": 0.62, "learning_rate": 6.619262722959714e-06, "loss": 1.3591, "step": 22757 }, { "epoch": 0.62, "learning_rate": 6.618430309103352e-06, "loss": 1.3538, "step": 22758 }, { "epoch": 0.62, "learning_rate": 6.617597921702802e-06, "loss": 1.2246, "step": 22759 }, { "epoch": 0.62, "learning_rate": 6.616765560764573e-06, "loss": 1.2905, "step": 22760 }, { "epoch": 0.62, "learning_rate": 6.615933226295182e-06, "loss": 1.2903, "step": 22761 }, { "epoch": 0.62, "learning_rate": 6.615100918301137e-06, "loss": 1.1372, "step": 22762 }, { "epoch": 0.62, "learning_rate": 6.6142686367889516e-06, "loss": 1.3452, "step": 22763 }, { "epoch": 0.62, "learning_rate": 6.613436381765135e-06, "loss": 1.2188, "step": 22764 }, { "epoch": 0.62, "learning_rate": 6.612604153236202e-06, "loss": 1.3538, "step": 22765 }, { "epoch": 0.62, "learning_rate": 6.6117719512086585e-06, "loss": 1.2097, "step": 22766 }, { "epoch": 0.62, "learning_rate": 6.610939775689018e-06, "loss": 1.3135, "step": 22767 }, { "epoch": 0.62, "learning_rate": 6.610107626683793e-06, "loss": 1.3804, "step": 22768 }, { "epoch": 0.62, "learning_rate": 6.6092755041994894e-06, "loss": 1.2615, "step": 22769 }, { "epoch": 0.62, "learning_rate": 6.608443408242623e-06, "loss": 1.3328, "step": 22770 }, { "epoch": 0.62, "learning_rate": 6.607611338819697e-06, "loss": 1.219, "step": 22771 }, { "epoch": 0.62, "learning_rate": 6.606779295937229e-06, "loss": 1.373, "step": 22772 }, { "epoch": 0.62, "learning_rate": 6.605947279601721e-06, "loss": 1.2742, "step": 22773 }, { "epoch": 0.62, "learning_rate": 6.605115289819686e-06, "loss": 1.3616, "step": 22774 }, { "epoch": 0.62, "learning_rate": 6.604283326597633e-06, "loss": 1.2412, "step": 22775 }, { "epoch": 0.62, "learning_rate": 6.60345138994207e-06, "loss": 1.2092, "step": 22776 }, { "epoch": 0.62, "learning_rate": 6.6026194798595065e-06, "loss": 1.2078, "step": 22777 }, { "epoch": 0.62, "learning_rate": 6.601787596356451e-06, "loss": 1.4019, "step": 22778 }, { "epoch": 0.62, "learning_rate": 6.600955739439411e-06, "loss": 1.3811, "step": 22779 }, { "epoch": 0.62, "learning_rate": 6.600123909114895e-06, "loss": 1.439, "step": 22780 }, { "epoch": 0.62, "learning_rate": 6.59929210538941e-06, "loss": 1.2244, "step": 22781 }, { "epoch": 0.62, "learning_rate": 6.598460328269467e-06, "loss": 1.3542, "step": 22782 }, { "epoch": 0.62, "learning_rate": 6.597628577761568e-06, "loss": 1.6025, "step": 22783 }, { "epoch": 0.62, "learning_rate": 6.596796853872221e-06, "loss": 1.3074, "step": 22784 }, { "epoch": 0.62, "learning_rate": 6.595965156607942e-06, "loss": 1.3779, "step": 22785 }, { "epoch": 0.62, "learning_rate": 6.595133485975224e-06, "loss": 1.2764, "step": 22786 }, { "epoch": 0.62, "learning_rate": 6.594301841980586e-06, "loss": 1.2991, "step": 22787 }, { "epoch": 0.62, "learning_rate": 6.593470224630525e-06, "loss": 1.2458, "step": 22788 }, { "epoch": 0.62, "learning_rate": 6.592638633931555e-06, "loss": 1.1643, "step": 22789 }, { "epoch": 0.62, "learning_rate": 6.591807069890173e-06, "loss": 1.1895, "step": 22790 }, { "epoch": 0.62, "learning_rate": 6.590975532512895e-06, "loss": 1.375, "step": 22791 }, { "epoch": 0.62, "learning_rate": 6.590144021806217e-06, "loss": 1.3164, "step": 22792 }, { "epoch": 0.62, "learning_rate": 6.5893125377766545e-06, "loss": 1.3291, "step": 22793 }, { "epoch": 0.62, "learning_rate": 6.5884810804307e-06, "loss": 1.4426, "step": 22794 }, { "epoch": 0.62, "learning_rate": 6.587649649774872e-06, "loss": 1.3174, "step": 22795 }, { "epoch": 0.62, "learning_rate": 6.586818245815662e-06, "loss": 1.1866, "step": 22796 }, { "epoch": 0.62, "learning_rate": 6.585986868559586e-06, "loss": 1.2385, "step": 22797 }, { "epoch": 0.62, "learning_rate": 6.58515551801314e-06, "loss": 1.3123, "step": 22798 }, { "epoch": 0.62, "learning_rate": 6.584324194182832e-06, "loss": 1.0908, "step": 22799 }, { "epoch": 0.62, "learning_rate": 6.583492897075166e-06, "loss": 1.0894, "step": 22800 }, { "epoch": 0.62, "learning_rate": 6.582661626696645e-06, "loss": 1.2737, "step": 22801 }, { "epoch": 0.62, "learning_rate": 6.581830383053773e-06, "loss": 1.2485, "step": 22802 }, { "epoch": 0.62, "learning_rate": 6.580999166153053e-06, "loss": 1.2566, "step": 22803 }, { "epoch": 0.62, "learning_rate": 6.5801679760009885e-06, "loss": 1.3708, "step": 22804 }, { "epoch": 0.62, "learning_rate": 6.579336812604078e-06, "loss": 1.2595, "step": 22805 }, { "epoch": 0.62, "learning_rate": 6.578505675968831e-06, "loss": 1.312, "step": 22806 }, { "epoch": 0.62, "learning_rate": 6.5776745661017464e-06, "loss": 1.1753, "step": 22807 }, { "epoch": 0.62, "learning_rate": 6.576843483009327e-06, "loss": 1.1887, "step": 22808 }, { "epoch": 0.62, "learning_rate": 6.576012426698073e-06, "loss": 1.2944, "step": 22809 }, { "epoch": 0.62, "learning_rate": 6.575181397174489e-06, "loss": 1.241, "step": 22810 }, { "epoch": 0.62, "learning_rate": 6.574350394445074e-06, "loss": 1.2791, "step": 22811 }, { "epoch": 0.62, "learning_rate": 6.573519418516332e-06, "loss": 1.3337, "step": 22812 }, { "epoch": 0.62, "learning_rate": 6.572688469394762e-06, "loss": 1.3149, "step": 22813 }, { "epoch": 0.62, "learning_rate": 6.571857547086864e-06, "loss": 1.2112, "step": 22814 }, { "epoch": 0.62, "learning_rate": 6.571026651599144e-06, "loss": 1.3994, "step": 22815 }, { "epoch": 0.62, "learning_rate": 6.570195782938097e-06, "loss": 1.272, "step": 22816 }, { "epoch": 0.62, "learning_rate": 6.569364941110227e-06, "loss": 1.3604, "step": 22817 }, { "epoch": 0.62, "learning_rate": 6.5685341261220306e-06, "loss": 1.0743, "step": 22818 }, { "epoch": 0.62, "learning_rate": 6.5677033379800116e-06, "loss": 1.228, "step": 22819 }, { "epoch": 0.62, "learning_rate": 6.566872576690666e-06, "loss": 1.4805, "step": 22820 }, { "epoch": 0.62, "learning_rate": 6.566041842260495e-06, "loss": 1.3386, "step": 22821 }, { "epoch": 0.62, "learning_rate": 6.565211134695999e-06, "loss": 1.1743, "step": 22822 }, { "epoch": 0.62, "learning_rate": 6.564380454003676e-06, "loss": 1.1064, "step": 22823 }, { "epoch": 0.62, "learning_rate": 6.5635498001900235e-06, "loss": 1.2539, "step": 22824 }, { "epoch": 0.62, "learning_rate": 6.5627191732615424e-06, "loss": 1.1912, "step": 22825 }, { "epoch": 0.62, "learning_rate": 6.5618885732247295e-06, "loss": 1.3601, "step": 22826 }, { "epoch": 0.62, "learning_rate": 6.561058000086085e-06, "loss": 1.1257, "step": 22827 }, { "epoch": 0.62, "learning_rate": 6.560227453852104e-06, "loss": 1.161, "step": 22828 }, { "epoch": 0.62, "learning_rate": 6.559396934529283e-06, "loss": 1.7202, "step": 22829 }, { "epoch": 0.62, "learning_rate": 6.55856644212413e-06, "loss": 1.4136, "step": 22830 }, { "epoch": 0.62, "learning_rate": 6.557735976643127e-06, "loss": 1.2153, "step": 22831 }, { "epoch": 0.62, "learning_rate": 6.556905538092786e-06, "loss": 1.2571, "step": 22832 }, { "epoch": 0.62, "learning_rate": 6.5560751264795905e-06, "loss": 1.4353, "step": 22833 }, { "epoch": 0.62, "learning_rate": 6.555244741810051e-06, "loss": 1.4224, "step": 22834 }, { "epoch": 0.62, "learning_rate": 6.55441438409065e-06, "loss": 1.1687, "step": 22835 }, { "epoch": 0.62, "learning_rate": 6.553584053327897e-06, "loss": 1.3252, "step": 22836 }, { "epoch": 0.62, "learning_rate": 6.552753749528276e-06, "loss": 1.3301, "step": 22837 }, { "epoch": 0.62, "learning_rate": 6.5519234726982935e-06, "loss": 1.1987, "step": 22838 }, { "epoch": 0.62, "learning_rate": 6.551093222844436e-06, "loss": 1.2417, "step": 22839 }, { "epoch": 0.62, "learning_rate": 6.550262999973207e-06, "loss": 1.1255, "step": 22840 }, { "epoch": 0.62, "learning_rate": 6.549432804091094e-06, "loss": 1.1501, "step": 22841 }, { "epoch": 0.62, "learning_rate": 6.5486026352046014e-06, "loss": 1.2397, "step": 22842 }, { "epoch": 0.62, "learning_rate": 6.5477724933202135e-06, "loss": 1.0977, "step": 22843 }, { "epoch": 0.62, "learning_rate": 6.546942378444437e-06, "loss": 1.2019, "step": 22844 }, { "epoch": 0.62, "learning_rate": 6.546112290583751e-06, "loss": 1.2249, "step": 22845 }, { "epoch": 0.62, "learning_rate": 6.545282229744662e-06, "loss": 1.1763, "step": 22846 }, { "epoch": 0.62, "learning_rate": 6.544452195933662e-06, "loss": 1.0469, "step": 22847 }, { "epoch": 0.62, "learning_rate": 6.543622189157242e-06, "loss": 1.1924, "step": 22848 }, { "epoch": 0.62, "learning_rate": 6.542792209421896e-06, "loss": 1.1755, "step": 22849 }, { "epoch": 0.62, "learning_rate": 6.541962256734118e-06, "loss": 1.3806, "step": 22850 }, { "epoch": 0.62, "learning_rate": 6.5411323311004035e-06, "loss": 1.1208, "step": 22851 }, { "epoch": 0.62, "learning_rate": 6.540302432527241e-06, "loss": 1.3079, "step": 22852 }, { "epoch": 0.62, "learning_rate": 6.539472561021127e-06, "loss": 1.4155, "step": 22853 }, { "epoch": 0.62, "learning_rate": 6.538642716588551e-06, "loss": 1.1069, "step": 22854 }, { "epoch": 0.62, "learning_rate": 6.537812899236008e-06, "loss": 1.4014, "step": 22855 }, { "epoch": 0.62, "learning_rate": 6.536983108969988e-06, "loss": 1.6426, "step": 22856 }, { "epoch": 0.62, "learning_rate": 6.536153345796984e-06, "loss": 1.1338, "step": 22857 }, { "epoch": 0.62, "learning_rate": 6.535323609723486e-06, "loss": 1.2622, "step": 22858 }, { "epoch": 0.62, "learning_rate": 6.534493900755989e-06, "loss": 1.2778, "step": 22859 }, { "epoch": 0.62, "learning_rate": 6.5336642189009816e-06, "loss": 1.3162, "step": 22860 }, { "epoch": 0.62, "learning_rate": 6.532834564164954e-06, "loss": 1.2349, "step": 22861 }, { "epoch": 0.62, "learning_rate": 6.532004936554399e-06, "loss": 1.2166, "step": 22862 }, { "epoch": 0.62, "learning_rate": 6.531175336075807e-06, "loss": 1.3328, "step": 22863 }, { "epoch": 0.62, "learning_rate": 6.530345762735668e-06, "loss": 1.311, "step": 22864 }, { "epoch": 0.62, "learning_rate": 6.5295162165404725e-06, "loss": 1.322, "step": 22865 }, { "epoch": 0.62, "learning_rate": 6.528686697496711e-06, "loss": 1.2668, "step": 22866 }, { "epoch": 0.62, "learning_rate": 6.52785720561087e-06, "loss": 1.2462, "step": 22867 }, { "epoch": 0.62, "learning_rate": 6.5270277408894445e-06, "loss": 1.209, "step": 22868 }, { "epoch": 0.62, "learning_rate": 6.526198303338918e-06, "loss": 1.1912, "step": 22869 }, { "epoch": 0.62, "learning_rate": 6.525368892965784e-06, "loss": 1.3567, "step": 22870 }, { "epoch": 0.62, "learning_rate": 6.5245395097765285e-06, "loss": 1.3347, "step": 22871 }, { "epoch": 0.62, "learning_rate": 6.523710153777645e-06, "loss": 1.248, "step": 22872 }, { "epoch": 0.62, "learning_rate": 6.522880824975615e-06, "loss": 1.2272, "step": 22873 }, { "epoch": 0.62, "learning_rate": 6.522051523376933e-06, "loss": 1.1965, "step": 22874 }, { "epoch": 0.62, "learning_rate": 6.5212222489880815e-06, "loss": 1.2378, "step": 22875 }, { "epoch": 0.62, "learning_rate": 6.52039300181555e-06, "loss": 1.3545, "step": 22876 }, { "epoch": 0.62, "learning_rate": 6.5195637818658346e-06, "loss": 1.3662, "step": 22877 }, { "epoch": 0.62, "learning_rate": 6.518734589145407e-06, "loss": 1.0508, "step": 22878 }, { "epoch": 0.62, "learning_rate": 6.517905423660771e-06, "loss": 1.1501, "step": 22879 }, { "epoch": 0.62, "learning_rate": 6.517076285418398e-06, "loss": 1.1292, "step": 22880 }, { "epoch": 0.62, "learning_rate": 6.51624717442479e-06, "loss": 1.7334, "step": 22881 }, { "epoch": 0.62, "learning_rate": 6.515418090686418e-06, "loss": 1.2607, "step": 22882 }, { "epoch": 0.62, "learning_rate": 6.514589034209784e-06, "loss": 1.3237, "step": 22883 }, { "epoch": 0.62, "learning_rate": 6.513760005001359e-06, "loss": 1.3115, "step": 22884 }, { "epoch": 0.62, "learning_rate": 6.512931003067644e-06, "loss": 1.3259, "step": 22885 }, { "epoch": 0.63, "learning_rate": 6.5121020284151105e-06, "loss": 1.0815, "step": 22886 }, { "epoch": 0.63, "learning_rate": 6.511273081050257e-06, "loss": 1.2234, "step": 22887 }, { "epoch": 0.63, "learning_rate": 6.510444160979555e-06, "loss": 1.3667, "step": 22888 }, { "epoch": 0.63, "learning_rate": 6.509615268209504e-06, "loss": 1.312, "step": 22889 }, { "epoch": 0.63, "learning_rate": 6.508786402746576e-06, "loss": 1.3604, "step": 22890 }, { "epoch": 0.63, "learning_rate": 6.507957564597262e-06, "loss": 1.2595, "step": 22891 }, { "epoch": 0.63, "learning_rate": 6.507128753768051e-06, "loss": 1.2019, "step": 22892 }, { "epoch": 0.63, "learning_rate": 6.506299970265417e-06, "loss": 1.2395, "step": 22893 }, { "epoch": 0.63, "learning_rate": 6.505471214095853e-06, "loss": 1.2014, "step": 22894 }, { "epoch": 0.63, "learning_rate": 6.5046424852658364e-06, "loss": 1.3069, "step": 22895 }, { "epoch": 0.63, "learning_rate": 6.503813783781856e-06, "loss": 1.2676, "step": 22896 }, { "epoch": 0.63, "learning_rate": 6.5029851096503895e-06, "loss": 1.2695, "step": 22897 }, { "epoch": 0.63, "learning_rate": 6.502156462877925e-06, "loss": 1.2783, "step": 22898 }, { "epoch": 0.63, "learning_rate": 6.501327843470943e-06, "loss": 1.3406, "step": 22899 }, { "epoch": 0.63, "learning_rate": 6.500499251435928e-06, "loss": 1.4934, "step": 22900 }, { "epoch": 0.63, "learning_rate": 6.499670686779358e-06, "loss": 1.3369, "step": 22901 }, { "epoch": 0.63, "learning_rate": 6.498842149507722e-06, "loss": 1.3599, "step": 22902 }, { "epoch": 0.63, "learning_rate": 6.498013639627496e-06, "loss": 1.2974, "step": 22903 }, { "epoch": 0.63, "learning_rate": 6.4971851571451675e-06, "loss": 1.4751, "step": 22904 }, { "epoch": 0.63, "learning_rate": 6.496356702067212e-06, "loss": 1.2329, "step": 22905 }, { "epoch": 0.63, "learning_rate": 6.495528274400117e-06, "loss": 1.0076, "step": 22906 }, { "epoch": 0.63, "learning_rate": 6.4946998741503585e-06, "loss": 1.209, "step": 22907 }, { "epoch": 0.63, "learning_rate": 6.49387150132442e-06, "loss": 1.3867, "step": 22908 }, { "epoch": 0.63, "learning_rate": 6.493043155928785e-06, "loss": 1.345, "step": 22909 }, { "epoch": 0.63, "learning_rate": 6.492214837969928e-06, "loss": 1.3645, "step": 22910 }, { "epoch": 0.63, "learning_rate": 6.491386547454335e-06, "loss": 1.2832, "step": 22911 }, { "epoch": 0.63, "learning_rate": 6.4905582843884815e-06, "loss": 1.2043, "step": 22912 }, { "epoch": 0.63, "learning_rate": 6.4897300487788515e-06, "loss": 1.1831, "step": 22913 }, { "epoch": 0.63, "learning_rate": 6.488901840631922e-06, "loss": 1.2898, "step": 22914 }, { "epoch": 0.63, "learning_rate": 6.488073659954175e-06, "loss": 1.2839, "step": 22915 }, { "epoch": 0.63, "learning_rate": 6.487245506752086e-06, "loss": 1.79, "step": 22916 }, { "epoch": 0.63, "learning_rate": 6.486417381032139e-06, "loss": 1.0854, "step": 22917 }, { "epoch": 0.63, "learning_rate": 6.485589282800807e-06, "loss": 1.6348, "step": 22918 }, { "epoch": 0.63, "learning_rate": 6.484761212064574e-06, "loss": 1.4121, "step": 22919 }, { "epoch": 0.63, "learning_rate": 6.483933168829916e-06, "loss": 1.2356, "step": 22920 }, { "epoch": 0.63, "learning_rate": 6.483105153103313e-06, "loss": 1.3723, "step": 22921 }, { "epoch": 0.63, "learning_rate": 6.482277164891237e-06, "loss": 1.231, "step": 22922 }, { "epoch": 0.63, "learning_rate": 6.481449204200172e-06, "loss": 1.3237, "step": 22923 }, { "epoch": 0.63, "learning_rate": 6.480621271036598e-06, "loss": 1.3628, "step": 22924 }, { "epoch": 0.63, "learning_rate": 6.479793365406981e-06, "loss": 1.3611, "step": 22925 }, { "epoch": 0.63, "learning_rate": 6.478965487317814e-06, "loss": 1.135, "step": 22926 }, { "epoch": 0.63, "learning_rate": 6.478137636775557e-06, "loss": 1.1902, "step": 22927 }, { "epoch": 0.63, "learning_rate": 6.477309813786703e-06, "loss": 1.3176, "step": 22928 }, { "epoch": 0.63, "learning_rate": 6.476482018357713e-06, "loss": 1.26, "step": 22929 }, { "epoch": 0.63, "learning_rate": 6.4756542504950784e-06, "loss": 1.1592, "step": 22930 }, { "epoch": 0.63, "learning_rate": 6.474826510205261e-06, "loss": 1.21, "step": 22931 }, { "epoch": 0.63, "learning_rate": 6.473998797494749e-06, "loss": 1.3252, "step": 22932 }, { "epoch": 0.63, "learning_rate": 6.4731711123700055e-06, "loss": 1.6841, "step": 22933 }, { "epoch": 0.63, "learning_rate": 6.47234345483752e-06, "loss": 1.0438, "step": 22934 }, { "epoch": 0.63, "learning_rate": 6.471515824903755e-06, "loss": 1.3401, "step": 22935 }, { "epoch": 0.63, "learning_rate": 6.470688222575194e-06, "loss": 1.2402, "step": 22936 }, { "epoch": 0.63, "learning_rate": 6.469860647858306e-06, "loss": 1.2715, "step": 22937 }, { "epoch": 0.63, "learning_rate": 6.46903310075957e-06, "loss": 1.3574, "step": 22938 }, { "epoch": 0.63, "learning_rate": 6.46820558128546e-06, "loss": 1.3665, "step": 22939 }, { "epoch": 0.63, "learning_rate": 6.4673780894424465e-06, "loss": 1.2041, "step": 22940 }, { "epoch": 0.63, "learning_rate": 6.466550625237007e-06, "loss": 1.1917, "step": 22941 }, { "epoch": 0.63, "learning_rate": 6.465723188675613e-06, "loss": 1.3254, "step": 22942 }, { "epoch": 0.63, "learning_rate": 6.464895779764742e-06, "loss": 1.2629, "step": 22943 }, { "epoch": 0.63, "learning_rate": 6.464068398510859e-06, "loss": 1.3928, "step": 22944 }, { "epoch": 0.63, "learning_rate": 6.463241044920447e-06, "loss": 1.1953, "step": 22945 }, { "epoch": 0.63, "learning_rate": 6.46241371899997e-06, "loss": 1.2563, "step": 22946 }, { "epoch": 0.63, "learning_rate": 6.461586420755908e-06, "loss": 1.3706, "step": 22947 }, { "epoch": 0.63, "learning_rate": 6.460759150194726e-06, "loss": 1.1929, "step": 22948 }, { "epoch": 0.63, "learning_rate": 6.459931907322904e-06, "loss": 1.3389, "step": 22949 }, { "epoch": 0.63, "learning_rate": 6.459104692146907e-06, "loss": 1.3711, "step": 22950 }, { "epoch": 0.63, "learning_rate": 6.4582775046732135e-06, "loss": 1.4485, "step": 22951 }, { "epoch": 0.63, "learning_rate": 6.457450344908287e-06, "loss": 1.3301, "step": 22952 }, { "epoch": 0.63, "learning_rate": 6.456623212858605e-06, "loss": 1.3826, "step": 22953 }, { "epoch": 0.63, "learning_rate": 6.455796108530639e-06, "loss": 1.2742, "step": 22954 }, { "epoch": 0.63, "learning_rate": 6.454969031930854e-06, "loss": 1.3967, "step": 22955 }, { "epoch": 0.63, "learning_rate": 6.454141983065727e-06, "loss": 1.3464, "step": 22956 }, { "epoch": 0.63, "learning_rate": 6.453314961941724e-06, "loss": 1.4126, "step": 22957 }, { "epoch": 0.63, "learning_rate": 6.45248796856532e-06, "loss": 1.1882, "step": 22958 }, { "epoch": 0.63, "learning_rate": 6.451661002942977e-06, "loss": 1.3047, "step": 22959 }, { "epoch": 0.63, "learning_rate": 6.450834065081175e-06, "loss": 1.2429, "step": 22960 }, { "epoch": 0.63, "learning_rate": 6.4500071549863745e-06, "loss": 1.0206, "step": 22961 }, { "epoch": 0.63, "learning_rate": 6.449180272665051e-06, "loss": 1.2959, "step": 22962 }, { "epoch": 0.63, "learning_rate": 6.4483534181236695e-06, "loss": 1.155, "step": 22963 }, { "epoch": 0.63, "learning_rate": 6.4475265913687025e-06, "loss": 1.0867, "step": 22964 }, { "epoch": 0.63, "learning_rate": 6.446699792406615e-06, "loss": 1.6929, "step": 22965 }, { "epoch": 0.63, "learning_rate": 6.44587302124388e-06, "loss": 1.1884, "step": 22966 }, { "epoch": 0.63, "learning_rate": 6.4450462778869606e-06, "loss": 1.3049, "step": 22967 }, { "epoch": 0.63, "learning_rate": 6.44421956234233e-06, "loss": 1.3445, "step": 22968 }, { "epoch": 0.63, "learning_rate": 6.443392874616449e-06, "loss": 1.3137, "step": 22969 }, { "epoch": 0.63, "learning_rate": 6.4425662147157915e-06, "loss": 1.2299, "step": 22970 }, { "epoch": 0.63, "learning_rate": 6.441739582646827e-06, "loss": 1.3784, "step": 22971 }, { "epoch": 0.63, "learning_rate": 6.440912978416014e-06, "loss": 1.3738, "step": 22972 }, { "epoch": 0.63, "learning_rate": 6.440086402029828e-06, "loss": 1.178, "step": 22973 }, { "epoch": 0.63, "learning_rate": 6.439259853494729e-06, "loss": 1.2573, "step": 22974 }, { "epoch": 0.63, "learning_rate": 6.438433332817189e-06, "loss": 1.3884, "step": 22975 }, { "epoch": 0.63, "learning_rate": 6.43760684000367e-06, "loss": 1.2539, "step": 22976 }, { "epoch": 0.63, "learning_rate": 6.436780375060643e-06, "loss": 1.2439, "step": 22977 }, { "epoch": 0.63, "learning_rate": 6.4359539379945666e-06, "loss": 1.4082, "step": 22978 }, { "epoch": 0.63, "learning_rate": 6.4351275288119145e-06, "loss": 1.4006, "step": 22979 }, { "epoch": 0.63, "learning_rate": 6.434301147519144e-06, "loss": 1.3049, "step": 22980 }, { "epoch": 0.63, "learning_rate": 6.433474794122729e-06, "loss": 1.3831, "step": 22981 }, { "epoch": 0.63, "learning_rate": 6.432648468629128e-06, "loss": 1.2449, "step": 22982 }, { "epoch": 0.63, "learning_rate": 6.431822171044808e-06, "loss": 1.4517, "step": 22983 }, { "epoch": 0.63, "learning_rate": 6.430995901376234e-06, "loss": 1.3579, "step": 22984 }, { "epoch": 0.63, "learning_rate": 6.430169659629868e-06, "loss": 1.1682, "step": 22985 }, { "epoch": 0.63, "learning_rate": 6.429343445812177e-06, "loss": 1.1255, "step": 22986 }, { "epoch": 0.63, "learning_rate": 6.428517259929623e-06, "loss": 1.2637, "step": 22987 }, { "epoch": 0.63, "learning_rate": 6.427691101988673e-06, "loss": 1.3462, "step": 22988 }, { "epoch": 0.63, "learning_rate": 6.426864971995787e-06, "loss": 1.1333, "step": 22989 }, { "epoch": 0.63, "learning_rate": 6.4260388699574295e-06, "loss": 1.3369, "step": 22990 }, { "epoch": 0.63, "learning_rate": 6.425212795880061e-06, "loss": 1.1494, "step": 22991 }, { "epoch": 0.63, "learning_rate": 6.42438674977015e-06, "loss": 1.2849, "step": 22992 }, { "epoch": 0.63, "learning_rate": 6.423560731634153e-06, "loss": 1.0733, "step": 22993 }, { "epoch": 0.63, "learning_rate": 6.422734741478536e-06, "loss": 1.3232, "step": 22994 }, { "epoch": 0.63, "learning_rate": 6.42190877930976e-06, "loss": 1.2319, "step": 22995 }, { "epoch": 0.63, "learning_rate": 6.421082845134289e-06, "loss": 1.2317, "step": 22996 }, { "epoch": 0.63, "learning_rate": 6.42025693895858e-06, "loss": 1.2629, "step": 22997 }, { "epoch": 0.63, "learning_rate": 6.4194310607891005e-06, "loss": 1.3472, "step": 22998 }, { "epoch": 0.63, "learning_rate": 6.418605210632305e-06, "loss": 1.2468, "step": 22999 }, { "epoch": 0.63, "learning_rate": 6.4177793884946604e-06, "loss": 1.2676, "step": 23000 }, { "epoch": 0.63, "learning_rate": 6.416953594382626e-06, "loss": 1.2798, "step": 23001 }, { "epoch": 0.63, "learning_rate": 6.416127828302658e-06, "loss": 1.304, "step": 23002 }, { "epoch": 0.63, "learning_rate": 6.415302090261226e-06, "loss": 1.4395, "step": 23003 }, { "epoch": 0.63, "learning_rate": 6.41447638026478e-06, "loss": 1.2515, "step": 23004 }, { "epoch": 0.63, "learning_rate": 6.41365069831979e-06, "loss": 1.2734, "step": 23005 }, { "epoch": 0.63, "learning_rate": 6.412825044432705e-06, "loss": 1.425, "step": 23006 }, { "epoch": 0.63, "learning_rate": 6.411999418609995e-06, "loss": 1.2122, "step": 23007 }, { "epoch": 0.63, "learning_rate": 6.41117382085811e-06, "loss": 1.2144, "step": 23008 }, { "epoch": 0.63, "learning_rate": 6.410348251183518e-06, "loss": 1.3638, "step": 23009 }, { "epoch": 0.63, "learning_rate": 6.4095227095926684e-06, "loss": 1.2822, "step": 23010 }, { "epoch": 0.63, "learning_rate": 6.40869719609203e-06, "loss": 1.2402, "step": 23011 }, { "epoch": 0.63, "learning_rate": 6.407871710688049e-06, "loss": 1.1699, "step": 23012 }, { "epoch": 0.63, "learning_rate": 6.407046253387199e-06, "loss": 1.2881, "step": 23013 }, { "epoch": 0.63, "learning_rate": 6.406220824195922e-06, "loss": 1.3582, "step": 23014 }, { "epoch": 0.63, "learning_rate": 6.405395423120686e-06, "loss": 1.3831, "step": 23015 }, { "epoch": 0.63, "learning_rate": 6.404570050167947e-06, "loss": 1.1152, "step": 23016 }, { "epoch": 0.63, "learning_rate": 6.4037447053441606e-06, "loss": 1.3267, "step": 23017 }, { "epoch": 0.63, "learning_rate": 6.402919388655786e-06, "loss": 1.1396, "step": 23018 }, { "epoch": 0.63, "learning_rate": 6.402094100109276e-06, "loss": 1.3728, "step": 23019 }, { "epoch": 0.63, "learning_rate": 6.401268839711092e-06, "loss": 1.1965, "step": 23020 }, { "epoch": 0.63, "learning_rate": 6.400443607467688e-06, "loss": 1.2651, "step": 23021 }, { "epoch": 0.63, "learning_rate": 6.399618403385522e-06, "loss": 1.3601, "step": 23022 }, { "epoch": 0.63, "learning_rate": 6.398793227471045e-06, "loss": 1.2754, "step": 23023 }, { "epoch": 0.63, "learning_rate": 6.397968079730719e-06, "loss": 1.3943, "step": 23024 }, { "epoch": 0.63, "learning_rate": 6.397142960170996e-06, "loss": 1.3813, "step": 23025 }, { "epoch": 0.63, "learning_rate": 6.396317868798333e-06, "loss": 1.2439, "step": 23026 }, { "epoch": 0.63, "learning_rate": 6.395492805619184e-06, "loss": 1.2637, "step": 23027 }, { "epoch": 0.63, "learning_rate": 6.394667770640004e-06, "loss": 1.3132, "step": 23028 }, { "epoch": 0.63, "learning_rate": 6.393842763867248e-06, "loss": 1.3408, "step": 23029 }, { "epoch": 0.63, "learning_rate": 6.393017785307371e-06, "loss": 1.2494, "step": 23030 }, { "epoch": 0.63, "learning_rate": 6.392192834966826e-06, "loss": 1.4106, "step": 23031 }, { "epoch": 0.63, "learning_rate": 6.391367912852067e-06, "loss": 1.1273, "step": 23032 }, { "epoch": 0.63, "learning_rate": 6.39054301896955e-06, "loss": 1.408, "step": 23033 }, { "epoch": 0.63, "learning_rate": 6.389718153325727e-06, "loss": 1.2202, "step": 23034 }, { "epoch": 0.63, "learning_rate": 6.3888933159270525e-06, "loss": 1.2727, "step": 23035 }, { "epoch": 0.63, "learning_rate": 6.3880685067799765e-06, "loss": 1.3303, "step": 23036 }, { "epoch": 0.63, "learning_rate": 6.387243725890957e-06, "loss": 1.2175, "step": 23037 }, { "epoch": 0.63, "learning_rate": 6.38641897326644e-06, "loss": 1.24, "step": 23038 }, { "epoch": 0.63, "learning_rate": 6.385594248912885e-06, "loss": 1.1831, "step": 23039 }, { "epoch": 0.63, "learning_rate": 6.384769552836738e-06, "loss": 1.3484, "step": 23040 }, { "epoch": 0.63, "learning_rate": 6.3839448850444574e-06, "loss": 1.2263, "step": 23041 }, { "epoch": 0.63, "learning_rate": 6.383120245542489e-06, "loss": 1.3311, "step": 23042 }, { "epoch": 0.63, "learning_rate": 6.3822956343372884e-06, "loss": 1.292, "step": 23043 }, { "epoch": 0.63, "learning_rate": 6.381471051435304e-06, "loss": 1.1917, "step": 23044 }, { "epoch": 0.63, "learning_rate": 6.3806464968429905e-06, "loss": 1.3193, "step": 23045 }, { "epoch": 0.63, "learning_rate": 6.379821970566795e-06, "loss": 1.3921, "step": 23046 }, { "epoch": 0.63, "learning_rate": 6.378997472613168e-06, "loss": 1.323, "step": 23047 }, { "epoch": 0.63, "learning_rate": 6.378173002988568e-06, "loss": 1.259, "step": 23048 }, { "epoch": 0.63, "learning_rate": 6.377348561699434e-06, "loss": 1.3792, "step": 23049 }, { "epoch": 0.63, "learning_rate": 6.376524148752227e-06, "loss": 1.2773, "step": 23050 }, { "epoch": 0.63, "learning_rate": 6.375699764153384e-06, "loss": 1.1157, "step": 23051 }, { "epoch": 0.63, "learning_rate": 6.374875407909369e-06, "loss": 1.3718, "step": 23052 }, { "epoch": 0.63, "learning_rate": 6.374051080026619e-06, "loss": 1.1145, "step": 23053 }, { "epoch": 0.63, "learning_rate": 6.373226780511592e-06, "loss": 1.1458, "step": 23054 }, { "epoch": 0.63, "learning_rate": 6.37240250937073e-06, "loss": 1.3459, "step": 23055 }, { "epoch": 0.63, "learning_rate": 6.371578266610489e-06, "loss": 1.4229, "step": 23056 }, { "epoch": 0.63, "learning_rate": 6.370754052237307e-06, "loss": 1.0842, "step": 23057 }, { "epoch": 0.63, "learning_rate": 6.369929866257647e-06, "loss": 1.2188, "step": 23058 }, { "epoch": 0.63, "learning_rate": 6.36910570867794e-06, "loss": 1.3149, "step": 23059 }, { "epoch": 0.63, "learning_rate": 6.36828157950465e-06, "loss": 1.2646, "step": 23060 }, { "epoch": 0.63, "learning_rate": 6.367457478744211e-06, "loss": 1.2029, "step": 23061 }, { "epoch": 0.63, "learning_rate": 6.366633406403079e-06, "loss": 1.4121, "step": 23062 }, { "epoch": 0.63, "learning_rate": 6.3658093624877e-06, "loss": 1.2588, "step": 23063 }, { "epoch": 0.63, "learning_rate": 6.364985347004518e-06, "loss": 1.1892, "step": 23064 }, { "epoch": 0.63, "learning_rate": 6.364161359959984e-06, "loss": 1.2935, "step": 23065 }, { "epoch": 0.63, "learning_rate": 6.363337401360539e-06, "loss": 1.2383, "step": 23066 }, { "epoch": 0.63, "learning_rate": 6.362513471212635e-06, "loss": 1.2307, "step": 23067 }, { "epoch": 0.63, "learning_rate": 6.361689569522711e-06, "loss": 1.4619, "step": 23068 }, { "epoch": 0.63, "learning_rate": 6.36086569629722e-06, "loss": 1.3552, "step": 23069 }, { "epoch": 0.63, "learning_rate": 6.360041851542603e-06, "loss": 1.2202, "step": 23070 }, { "epoch": 0.63, "learning_rate": 6.359218035265309e-06, "loss": 1.4353, "step": 23071 }, { "epoch": 0.63, "learning_rate": 6.358394247471779e-06, "loss": 1.325, "step": 23072 }, { "epoch": 0.63, "learning_rate": 6.357570488168462e-06, "loss": 1.3716, "step": 23073 }, { "epoch": 0.63, "learning_rate": 6.356746757361798e-06, "loss": 1.2944, "step": 23074 }, { "epoch": 0.63, "learning_rate": 6.355923055058238e-06, "loss": 1.3608, "step": 23075 }, { "epoch": 0.63, "learning_rate": 6.355099381264218e-06, "loss": 1.1497, "step": 23076 }, { "epoch": 0.63, "learning_rate": 6.354275735986189e-06, "loss": 1.3271, "step": 23077 }, { "epoch": 0.63, "learning_rate": 6.353452119230592e-06, "loss": 1.2683, "step": 23078 }, { "epoch": 0.63, "learning_rate": 6.35262853100387e-06, "loss": 1.2639, "step": 23079 }, { "epoch": 0.63, "learning_rate": 6.35180497131247e-06, "loss": 1.219, "step": 23080 }, { "epoch": 0.63, "learning_rate": 6.350981440162829e-06, "loss": 1.2673, "step": 23081 }, { "epoch": 0.63, "learning_rate": 6.350157937561396e-06, "loss": 1.3203, "step": 23082 }, { "epoch": 0.63, "learning_rate": 6.349334463514608e-06, "loss": 1.2451, "step": 23083 }, { "epoch": 0.63, "learning_rate": 6.348511018028914e-06, "loss": 1.2166, "step": 23084 }, { "epoch": 0.63, "learning_rate": 6.34768760111075e-06, "loss": 1.2024, "step": 23085 }, { "epoch": 0.63, "learning_rate": 6.346864212766563e-06, "loss": 1.272, "step": 23086 }, { "epoch": 0.63, "learning_rate": 6.346040853002791e-06, "loss": 1.1543, "step": 23087 }, { "epoch": 0.63, "learning_rate": 6.345217521825877e-06, "loss": 1.2463, "step": 23088 }, { "epoch": 0.63, "learning_rate": 6.3443942192422625e-06, "loss": 1.238, "step": 23089 }, { "epoch": 0.63, "learning_rate": 6.3435709452583904e-06, "loss": 1.3171, "step": 23090 }, { "epoch": 0.63, "learning_rate": 6.342747699880698e-06, "loss": 1.2817, "step": 23091 }, { "epoch": 0.63, "learning_rate": 6.341924483115629e-06, "loss": 1.1648, "step": 23092 }, { "epoch": 0.63, "learning_rate": 6.3411012949696215e-06, "loss": 1.3208, "step": 23093 }, { "epoch": 0.63, "learning_rate": 6.340278135449115e-06, "loss": 1.2603, "step": 23094 }, { "epoch": 0.63, "learning_rate": 6.339455004560558e-06, "loss": 1.3, "step": 23095 }, { "epoch": 0.63, "learning_rate": 6.338631902310376e-06, "loss": 1.2036, "step": 23096 }, { "epoch": 0.63, "learning_rate": 6.337808828705024e-06, "loss": 1.3093, "step": 23097 }, { "epoch": 0.63, "learning_rate": 6.336985783750926e-06, "loss": 1.3091, "step": 23098 }, { "epoch": 0.63, "learning_rate": 6.336162767454535e-06, "loss": 1.3723, "step": 23099 }, { "epoch": 0.63, "learning_rate": 6.335339779822278e-06, "loss": 1.2622, "step": 23100 }, { "epoch": 0.63, "learning_rate": 6.3345168208606055e-06, "loss": 1.6094, "step": 23101 }, { "epoch": 0.63, "learning_rate": 6.333693890575945e-06, "loss": 1.2446, "step": 23102 }, { "epoch": 0.63, "learning_rate": 6.3328709889747445e-06, "loss": 1.146, "step": 23103 }, { "epoch": 0.63, "learning_rate": 6.332048116063429e-06, "loss": 1.248, "step": 23104 }, { "epoch": 0.63, "learning_rate": 6.331225271848454e-06, "loss": 1.1111, "step": 23105 }, { "epoch": 0.63, "learning_rate": 6.330402456336237e-06, "loss": 1.3579, "step": 23106 }, { "epoch": 0.63, "learning_rate": 6.3295796695332345e-06, "loss": 1.261, "step": 23107 }, { "epoch": 0.63, "learning_rate": 6.328756911445868e-06, "loss": 1.2446, "step": 23108 }, { "epoch": 0.63, "learning_rate": 6.327934182080584e-06, "loss": 1.1804, "step": 23109 }, { "epoch": 0.63, "learning_rate": 6.327111481443817e-06, "loss": 1.1929, "step": 23110 }, { "epoch": 0.63, "learning_rate": 6.326288809542001e-06, "loss": 1.2247, "step": 23111 }, { "epoch": 0.63, "learning_rate": 6.325466166381577e-06, "loss": 1.2527, "step": 23112 }, { "epoch": 0.63, "learning_rate": 6.324643551968974e-06, "loss": 1.2979, "step": 23113 }, { "epoch": 0.63, "learning_rate": 6.3238209663106345e-06, "loss": 1.1755, "step": 23114 }, { "epoch": 0.63, "learning_rate": 6.3229984094129895e-06, "loss": 1.2581, "step": 23115 }, { "epoch": 0.63, "learning_rate": 6.322175881282477e-06, "loss": 1.2649, "step": 23116 }, { "epoch": 0.63, "learning_rate": 6.321353381925529e-06, "loss": 1.2512, "step": 23117 }, { "epoch": 0.63, "learning_rate": 6.3205309113485844e-06, "loss": 1.2302, "step": 23118 }, { "epoch": 0.63, "learning_rate": 6.319708469558074e-06, "loss": 1.1887, "step": 23119 }, { "epoch": 0.63, "learning_rate": 6.318886056560436e-06, "loss": 1.1704, "step": 23120 }, { "epoch": 0.63, "learning_rate": 6.3180636723621e-06, "loss": 1.313, "step": 23121 }, { "epoch": 0.63, "learning_rate": 6.317241316969506e-06, "loss": 1.2188, "step": 23122 }, { "epoch": 0.63, "learning_rate": 6.31641899038908e-06, "loss": 1.3945, "step": 23123 }, { "epoch": 0.63, "learning_rate": 6.315596692627261e-06, "loss": 1.2659, "step": 23124 }, { "epoch": 0.63, "learning_rate": 6.314774423690484e-06, "loss": 1.2681, "step": 23125 }, { "epoch": 0.63, "learning_rate": 6.313952183585174e-06, "loss": 1.7158, "step": 23126 }, { "epoch": 0.63, "learning_rate": 6.313129972317773e-06, "loss": 1.2314, "step": 23127 }, { "epoch": 0.63, "learning_rate": 6.312307789894707e-06, "loss": 1.1648, "step": 23128 }, { "epoch": 0.63, "learning_rate": 6.311485636322413e-06, "loss": 1.137, "step": 23129 }, { "epoch": 0.63, "learning_rate": 6.310663511607317e-06, "loss": 1.333, "step": 23130 }, { "epoch": 0.63, "learning_rate": 6.309841415755859e-06, "loss": 1.0823, "step": 23131 }, { "epoch": 0.63, "learning_rate": 6.3090193487744655e-06, "loss": 1.3838, "step": 23132 }, { "epoch": 0.63, "learning_rate": 6.308197310669568e-06, "loss": 1.1885, "step": 23133 }, { "epoch": 0.63, "learning_rate": 6.307375301447599e-06, "loss": 1.167, "step": 23134 }, { "epoch": 0.63, "learning_rate": 6.30655332111499e-06, "loss": 1.1882, "step": 23135 }, { "epoch": 0.63, "learning_rate": 6.3057313696781695e-06, "loss": 1.1072, "step": 23136 }, { "epoch": 0.63, "learning_rate": 6.3049094471435726e-06, "loss": 1.3235, "step": 23137 }, { "epoch": 0.63, "learning_rate": 6.304087553517624e-06, "loss": 1.3706, "step": 23138 }, { "epoch": 0.63, "learning_rate": 6.3032656888067535e-06, "loss": 1.2263, "step": 23139 }, { "epoch": 0.63, "learning_rate": 6.3024438530174e-06, "loss": 1.1326, "step": 23140 }, { "epoch": 0.63, "learning_rate": 6.301622046155982e-06, "loss": 1.1804, "step": 23141 }, { "epoch": 0.63, "learning_rate": 6.300800268228939e-06, "loss": 1.3025, "step": 23142 }, { "epoch": 0.63, "learning_rate": 6.29997851924269e-06, "loss": 1.2766, "step": 23143 }, { "epoch": 0.63, "learning_rate": 6.299156799203675e-06, "loss": 1.2166, "step": 23144 }, { "epoch": 0.63, "learning_rate": 6.298335108118311e-06, "loss": 1.3174, "step": 23145 }, { "epoch": 0.63, "learning_rate": 6.297513445993038e-06, "loss": 1.4629, "step": 23146 }, { "epoch": 0.63, "learning_rate": 6.296691812834274e-06, "loss": 1.3281, "step": 23147 }, { "epoch": 0.63, "learning_rate": 6.295870208648457e-06, "loss": 1.4487, "step": 23148 }, { "epoch": 0.63, "learning_rate": 6.2950486334420025e-06, "loss": 1.1235, "step": 23149 }, { "epoch": 0.63, "learning_rate": 6.294227087221354e-06, "loss": 1.281, "step": 23150 }, { "epoch": 0.63, "learning_rate": 6.293405569992922e-06, "loss": 1.3064, "step": 23151 }, { "epoch": 0.63, "learning_rate": 6.292584081763149e-06, "loss": 1.3296, "step": 23152 }, { "epoch": 0.63, "learning_rate": 6.291762622538448e-06, "loss": 1.3135, "step": 23153 }, { "epoch": 0.63, "learning_rate": 6.2909411923252595e-06, "loss": 1.2922, "step": 23154 }, { "epoch": 0.63, "learning_rate": 6.290119791129996e-06, "loss": 1.3135, "step": 23155 }, { "epoch": 0.63, "learning_rate": 6.289298418959092e-06, "loss": 1.2559, "step": 23156 }, { "epoch": 0.63, "learning_rate": 6.288477075818975e-06, "loss": 1.2219, "step": 23157 }, { "epoch": 0.63, "learning_rate": 6.287655761716067e-06, "loss": 1.1382, "step": 23158 }, { "epoch": 0.63, "learning_rate": 6.286834476656796e-06, "loss": 1.0542, "step": 23159 }, { "epoch": 0.63, "learning_rate": 6.286013220647584e-06, "loss": 1.3008, "step": 23160 }, { "epoch": 0.63, "learning_rate": 6.285191993694861e-06, "loss": 1.218, "step": 23161 }, { "epoch": 0.63, "learning_rate": 6.284370795805046e-06, "loss": 1.0752, "step": 23162 }, { "epoch": 0.63, "learning_rate": 6.2835496269845685e-06, "loss": 1.2832, "step": 23163 }, { "epoch": 0.63, "learning_rate": 6.28272848723985e-06, "loss": 1.2869, "step": 23164 }, { "epoch": 0.63, "learning_rate": 6.281907376577316e-06, "loss": 1.4443, "step": 23165 }, { "epoch": 0.63, "learning_rate": 6.281086295003391e-06, "loss": 1.229, "step": 23166 }, { "epoch": 0.63, "learning_rate": 6.2802652425244995e-06, "loss": 1.2905, "step": 23167 }, { "epoch": 0.63, "learning_rate": 6.279444219147059e-06, "loss": 1.3486, "step": 23168 }, { "epoch": 0.63, "learning_rate": 6.278623224877502e-06, "loss": 1.1667, "step": 23169 }, { "epoch": 0.63, "learning_rate": 6.277802259722244e-06, "loss": 1.3354, "step": 23170 }, { "epoch": 0.63, "learning_rate": 6.276981323687712e-06, "loss": 1.2009, "step": 23171 }, { "epoch": 0.63, "learning_rate": 6.276160416780328e-06, "loss": 1.3726, "step": 23172 }, { "epoch": 0.63, "learning_rate": 6.275339539006512e-06, "loss": 1.2166, "step": 23173 }, { "epoch": 0.63, "learning_rate": 6.274518690372691e-06, "loss": 1.3447, "step": 23174 }, { "epoch": 0.63, "learning_rate": 6.273697870885281e-06, "loss": 1.3164, "step": 23175 }, { "epoch": 0.63, "learning_rate": 6.272877080550707e-06, "loss": 1.4028, "step": 23176 }, { "epoch": 0.63, "learning_rate": 6.2720563193753916e-06, "loss": 1.2468, "step": 23177 }, { "epoch": 0.63, "learning_rate": 6.2712355873657546e-06, "loss": 1.2115, "step": 23178 }, { "epoch": 0.63, "learning_rate": 6.270414884528215e-06, "loss": 1.1487, "step": 23179 }, { "epoch": 0.63, "learning_rate": 6.269594210869199e-06, "loss": 1.2036, "step": 23180 }, { "epoch": 0.63, "learning_rate": 6.26877356639512e-06, "loss": 1.3208, "step": 23181 }, { "epoch": 0.63, "learning_rate": 6.267952951112404e-06, "loss": 1.1511, "step": 23182 }, { "epoch": 0.63, "learning_rate": 6.2671323650274685e-06, "loss": 1.7012, "step": 23183 }, { "epoch": 0.63, "learning_rate": 6.266311808146734e-06, "loss": 1.3057, "step": 23184 }, { "epoch": 0.63, "learning_rate": 6.265491280476621e-06, "loss": 1.1792, "step": 23185 }, { "epoch": 0.63, "learning_rate": 6.2646707820235446e-06, "loss": 1.2927, "step": 23186 }, { "epoch": 0.63, "learning_rate": 6.263850312793933e-06, "loss": 1.3293, "step": 23187 }, { "epoch": 0.63, "learning_rate": 6.263029872794195e-06, "loss": 1.2686, "step": 23188 }, { "epoch": 0.63, "learning_rate": 6.26220946203076e-06, "loss": 1.3679, "step": 23189 }, { "epoch": 0.63, "learning_rate": 6.261389080510033e-06, "loss": 1.3721, "step": 23190 }, { "epoch": 0.63, "learning_rate": 6.260568728238447e-06, "loss": 1.3208, "step": 23191 }, { "epoch": 0.63, "learning_rate": 6.259748405222406e-06, "loss": 1.3237, "step": 23192 }, { "epoch": 0.63, "learning_rate": 6.258928111468341e-06, "loss": 1.2415, "step": 23193 }, { "epoch": 0.63, "learning_rate": 6.258107846982658e-06, "loss": 1.3323, "step": 23194 }, { "epoch": 0.63, "learning_rate": 6.257287611771785e-06, "loss": 1.1763, "step": 23195 }, { "epoch": 0.63, "learning_rate": 6.256467405842128e-06, "loss": 1.1956, "step": 23196 }, { "epoch": 0.63, "learning_rate": 6.255647229200116e-06, "loss": 1.3621, "step": 23197 }, { "epoch": 0.63, "learning_rate": 6.2548270818521525e-06, "loss": 1.3125, "step": 23198 }, { "epoch": 0.63, "learning_rate": 6.254006963804667e-06, "loss": 1.2603, "step": 23199 }, { "epoch": 0.63, "learning_rate": 6.253186875064064e-06, "loss": 1.197, "step": 23200 }, { "epoch": 0.63, "learning_rate": 6.252366815636768e-06, "loss": 1.3323, "step": 23201 }, { "epoch": 0.63, "learning_rate": 6.251546785529192e-06, "loss": 1.2446, "step": 23202 }, { "epoch": 0.63, "learning_rate": 6.25072678474775e-06, "loss": 1.3525, "step": 23203 }, { "epoch": 0.63, "learning_rate": 6.2499068132988605e-06, "loss": 1.1382, "step": 23204 }, { "epoch": 0.63, "learning_rate": 6.2490868711889344e-06, "loss": 1.1021, "step": 23205 }, { "epoch": 0.63, "learning_rate": 6.248266958424391e-06, "loss": 1.354, "step": 23206 }, { "epoch": 0.63, "learning_rate": 6.247447075011641e-06, "loss": 1.3674, "step": 23207 }, { "epoch": 0.63, "learning_rate": 6.246627220957102e-06, "loss": 1.3809, "step": 23208 }, { "epoch": 0.63, "learning_rate": 6.245807396267186e-06, "loss": 1.3745, "step": 23209 }, { "epoch": 0.63, "learning_rate": 6.244987600948309e-06, "loss": 1.2996, "step": 23210 }, { "epoch": 0.63, "learning_rate": 6.24416783500688e-06, "loss": 1.2979, "step": 23211 }, { "epoch": 0.63, "learning_rate": 6.24334809844932e-06, "loss": 1.314, "step": 23212 }, { "epoch": 0.63, "learning_rate": 6.242528391282034e-06, "loss": 1.2917, "step": 23213 }, { "epoch": 0.63, "learning_rate": 6.241708713511441e-06, "loss": 1.2717, "step": 23214 }, { "epoch": 0.63, "learning_rate": 6.240889065143951e-06, "loss": 1.2742, "step": 23215 }, { "epoch": 0.63, "learning_rate": 6.240069446185979e-06, "loss": 1.3291, "step": 23216 }, { "epoch": 0.63, "learning_rate": 6.239249856643932e-06, "loss": 1.2898, "step": 23217 }, { "epoch": 0.63, "learning_rate": 6.238430296524227e-06, "loss": 1.3057, "step": 23218 }, { "epoch": 0.63, "learning_rate": 6.237610765833277e-06, "loss": 1.3147, "step": 23219 }, { "epoch": 0.63, "learning_rate": 6.236791264577488e-06, "loss": 1.1682, "step": 23220 }, { "epoch": 0.63, "learning_rate": 6.235971792763278e-06, "loss": 1.1689, "step": 23221 }, { "epoch": 0.63, "learning_rate": 6.235152350397051e-06, "loss": 1.2996, "step": 23222 }, { "epoch": 0.63, "learning_rate": 6.2343329374852255e-06, "loss": 1.7085, "step": 23223 }, { "epoch": 0.63, "learning_rate": 6.233513554034205e-06, "loss": 1.2349, "step": 23224 }, { "epoch": 0.63, "learning_rate": 6.232694200050407e-06, "loss": 1.3896, "step": 23225 }, { "epoch": 0.63, "learning_rate": 6.231874875540233e-06, "loss": 1.4565, "step": 23226 }, { "epoch": 0.63, "learning_rate": 6.231055580510103e-06, "loss": 1.1599, "step": 23227 }, { "epoch": 0.63, "learning_rate": 6.230236314966419e-06, "loss": 1.2825, "step": 23228 }, { "epoch": 0.63, "learning_rate": 6.229417078915595e-06, "loss": 1.2705, "step": 23229 }, { "epoch": 0.63, "learning_rate": 6.228597872364037e-06, "loss": 1.2454, "step": 23230 }, { "epoch": 0.63, "learning_rate": 6.2277786953181585e-06, "loss": 1.1902, "step": 23231 }, { "epoch": 0.63, "learning_rate": 6.22695954778436e-06, "loss": 1.2856, "step": 23232 }, { "epoch": 0.63, "learning_rate": 6.226140429769059e-06, "loss": 1.3374, "step": 23233 }, { "epoch": 0.63, "learning_rate": 6.2253213412786626e-06, "loss": 1.3713, "step": 23234 }, { "epoch": 0.63, "learning_rate": 6.224502282319574e-06, "loss": 1.7646, "step": 23235 }, { "epoch": 0.63, "learning_rate": 6.223683252898207e-06, "loss": 1.3264, "step": 23236 }, { "epoch": 0.63, "learning_rate": 6.222864253020965e-06, "loss": 1.3328, "step": 23237 }, { "epoch": 0.63, "learning_rate": 6.222045282694258e-06, "loss": 1.1753, "step": 23238 }, { "epoch": 0.63, "learning_rate": 6.221226341924491e-06, "loss": 1.3352, "step": 23239 }, { "epoch": 0.63, "learning_rate": 6.220407430718074e-06, "loss": 1.2883, "step": 23240 }, { "epoch": 0.63, "learning_rate": 6.2195885490814104e-06, "loss": 1.2534, "step": 23241 }, { "epoch": 0.63, "learning_rate": 6.218769697020909e-06, "loss": 1.2561, "step": 23242 }, { "epoch": 0.63, "learning_rate": 6.217950874542974e-06, "loss": 1.2463, "step": 23243 }, { "epoch": 0.63, "learning_rate": 6.2171320816540144e-06, "loss": 1.2542, "step": 23244 }, { "epoch": 0.63, "learning_rate": 6.216313318360434e-06, "loss": 1.1108, "step": 23245 }, { "epoch": 0.63, "learning_rate": 6.21549458466864e-06, "loss": 1.334, "step": 23246 }, { "epoch": 0.63, "learning_rate": 6.214675880585035e-06, "loss": 1.3362, "step": 23247 }, { "epoch": 0.63, "learning_rate": 6.213857206116025e-06, "loss": 1.2104, "step": 23248 }, { "epoch": 0.63, "learning_rate": 6.213038561268019e-06, "loss": 1.3101, "step": 23249 }, { "epoch": 0.63, "learning_rate": 6.2122199460474175e-06, "loss": 1.4878, "step": 23250 }, { "epoch": 0.63, "learning_rate": 6.211401360460626e-06, "loss": 1.4185, "step": 23251 }, { "epoch": 0.63, "learning_rate": 6.210582804514047e-06, "loss": 1.2031, "step": 23252 }, { "epoch": 0.64, "learning_rate": 6.20976427821409e-06, "loss": 1.2778, "step": 23253 }, { "epoch": 0.64, "learning_rate": 6.20894578156715e-06, "loss": 1.2024, "step": 23254 }, { "epoch": 0.64, "learning_rate": 6.2081273145796396e-06, "loss": 1.3293, "step": 23255 }, { "epoch": 0.64, "learning_rate": 6.207308877257956e-06, "loss": 1.2922, "step": 23256 }, { "epoch": 0.64, "learning_rate": 6.206490469608506e-06, "loss": 1.665, "step": 23257 }, { "epoch": 0.64, "learning_rate": 6.205672091637689e-06, "loss": 1.293, "step": 23258 }, { "epoch": 0.64, "learning_rate": 6.204853743351911e-06, "loss": 1.3989, "step": 23259 }, { "epoch": 0.64, "learning_rate": 6.204035424757571e-06, "loss": 1.3184, "step": 23260 }, { "epoch": 0.64, "learning_rate": 6.203217135861075e-06, "loss": 1.416, "step": 23261 }, { "epoch": 0.64, "learning_rate": 6.2023988766688204e-06, "loss": 1.3105, "step": 23262 }, { "epoch": 0.64, "learning_rate": 6.201580647187211e-06, "loss": 1.3687, "step": 23263 }, { "epoch": 0.64, "learning_rate": 6.200762447422651e-06, "loss": 1.2974, "step": 23264 }, { "epoch": 0.64, "learning_rate": 6.199944277381533e-06, "loss": 1.4165, "step": 23265 }, { "epoch": 0.64, "learning_rate": 6.199126137070272e-06, "loss": 1.2915, "step": 23266 }, { "epoch": 0.64, "learning_rate": 6.198308026495256e-06, "loss": 1.2725, "step": 23267 }, { "epoch": 0.64, "learning_rate": 6.1974899456628946e-06, "loss": 1.3093, "step": 23268 }, { "epoch": 0.64, "learning_rate": 6.1966718945795774e-06, "loss": 1.074, "step": 23269 }, { "epoch": 0.64, "learning_rate": 6.195853873251718e-06, "loss": 1.2158, "step": 23270 }, { "epoch": 0.64, "learning_rate": 6.195035881685703e-06, "loss": 1.1499, "step": 23271 }, { "epoch": 0.64, "learning_rate": 6.194217919887944e-06, "loss": 1.3679, "step": 23272 }, { "epoch": 0.64, "learning_rate": 6.193399987864827e-06, "loss": 1.3528, "step": 23273 }, { "epoch": 0.64, "learning_rate": 6.192582085622766e-06, "loss": 1.2999, "step": 23274 }, { "epoch": 0.64, "learning_rate": 6.191764213168146e-06, "loss": 1.2202, "step": 23275 }, { "epoch": 0.64, "learning_rate": 6.190946370507378e-06, "loss": 1.2744, "step": 23276 }, { "epoch": 0.64, "learning_rate": 6.190128557646848e-06, "loss": 1.3765, "step": 23277 }, { "epoch": 0.64, "learning_rate": 6.189310774592967e-06, "loss": 1.2336, "step": 23278 }, { "epoch": 0.64, "learning_rate": 6.188493021352121e-06, "loss": 1.2314, "step": 23279 }, { "epoch": 0.64, "learning_rate": 6.187675297930715e-06, "loss": 1.2236, "step": 23280 }, { "epoch": 0.64, "learning_rate": 6.186857604335147e-06, "loss": 1.188, "step": 23281 }, { "epoch": 0.64, "learning_rate": 6.186039940571809e-06, "loss": 1.2654, "step": 23282 }, { "epoch": 0.64, "learning_rate": 6.185222306647105e-06, "loss": 1.2244, "step": 23283 }, { "epoch": 0.64, "learning_rate": 6.184404702567424e-06, "loss": 1.6973, "step": 23284 }, { "epoch": 0.64, "learning_rate": 6.18358712833917e-06, "loss": 1.3557, "step": 23285 }, { "epoch": 0.64, "learning_rate": 6.182769583968733e-06, "loss": 1.1487, "step": 23286 }, { "epoch": 0.64, "learning_rate": 6.181952069462514e-06, "loss": 1.1716, "step": 23287 }, { "epoch": 0.64, "learning_rate": 6.181134584826903e-06, "loss": 1.0029, "step": 23288 }, { "epoch": 0.64, "learning_rate": 6.180317130068303e-06, "loss": 1.4055, "step": 23289 }, { "epoch": 0.64, "learning_rate": 6.179499705193102e-06, "loss": 1.3125, "step": 23290 }, { "epoch": 0.64, "learning_rate": 6.178682310207702e-06, "loss": 1.4512, "step": 23291 }, { "epoch": 0.64, "learning_rate": 6.177864945118492e-06, "loss": 1.4333, "step": 23292 }, { "epoch": 0.64, "learning_rate": 6.177047609931873e-06, "loss": 1.3232, "step": 23293 }, { "epoch": 0.64, "learning_rate": 6.176230304654234e-06, "loss": 1.2095, "step": 23294 }, { "epoch": 0.64, "learning_rate": 6.175413029291969e-06, "loss": 1.2874, "step": 23295 }, { "epoch": 0.64, "learning_rate": 6.174595783851476e-06, "loss": 1.1816, "step": 23296 }, { "epoch": 0.64, "learning_rate": 6.173778568339146e-06, "loss": 1.3184, "step": 23297 }, { "epoch": 0.64, "learning_rate": 6.172961382761376e-06, "loss": 1.1597, "step": 23298 }, { "epoch": 0.64, "learning_rate": 6.172144227124552e-06, "loss": 1.3381, "step": 23299 }, { "epoch": 0.64, "learning_rate": 6.171327101435076e-06, "loss": 1.2593, "step": 23300 }, { "epoch": 0.64, "learning_rate": 6.170510005699333e-06, "loss": 1.2676, "step": 23301 }, { "epoch": 0.64, "learning_rate": 6.169692939923722e-06, "loss": 1.1646, "step": 23302 }, { "epoch": 0.64, "learning_rate": 6.168875904114628e-06, "loss": 1.2317, "step": 23303 }, { "epoch": 0.64, "learning_rate": 6.168058898278452e-06, "loss": 1.2737, "step": 23304 }, { "epoch": 0.64, "learning_rate": 6.167241922421579e-06, "loss": 1.2798, "step": 23305 }, { "epoch": 0.64, "learning_rate": 6.166424976550404e-06, "loss": 1.2393, "step": 23306 }, { "epoch": 0.64, "learning_rate": 6.165608060671315e-06, "loss": 1.7153, "step": 23307 }, { "epoch": 0.64, "learning_rate": 6.164791174790707e-06, "loss": 1.4075, "step": 23308 }, { "epoch": 0.64, "learning_rate": 6.163974318914969e-06, "loss": 1.2158, "step": 23309 }, { "epoch": 0.64, "learning_rate": 6.163157493050489e-06, "loss": 1.2625, "step": 23310 }, { "epoch": 0.64, "learning_rate": 6.162340697203668e-06, "loss": 1.4285, "step": 23311 }, { "epoch": 0.64, "learning_rate": 6.161523931380882e-06, "loss": 1.1592, "step": 23312 }, { "epoch": 0.64, "learning_rate": 6.160707195588533e-06, "loss": 1.2776, "step": 23313 }, { "epoch": 0.64, "learning_rate": 6.159890489833e-06, "loss": 1.2375, "step": 23314 }, { "epoch": 0.64, "learning_rate": 6.159073814120684e-06, "loss": 1.1733, "step": 23315 }, { "epoch": 0.64, "learning_rate": 6.158257168457964e-06, "loss": 1.2461, "step": 23316 }, { "epoch": 0.64, "learning_rate": 6.157440552851237e-06, "loss": 1.0854, "step": 23317 }, { "epoch": 0.64, "learning_rate": 6.1566239673068824e-06, "loss": 1.3157, "step": 23318 }, { "epoch": 0.64, "learning_rate": 6.155807411831303e-06, "loss": 1.4856, "step": 23319 }, { "epoch": 0.64, "learning_rate": 6.15499088643087e-06, "loss": 1.3164, "step": 23320 }, { "epoch": 0.64, "learning_rate": 6.154174391111989e-06, "loss": 0.9878, "step": 23321 }, { "epoch": 0.64, "learning_rate": 6.15335792588103e-06, "loss": 1.3738, "step": 23322 }, { "epoch": 0.64, "learning_rate": 6.152541490744398e-06, "loss": 1.0504, "step": 23323 }, { "epoch": 0.64, "learning_rate": 6.151725085708465e-06, "loss": 1.4065, "step": 23324 }, { "epoch": 0.64, "learning_rate": 6.150908710779628e-06, "loss": 1.2222, "step": 23325 }, { "epoch": 0.64, "learning_rate": 6.150092365964273e-06, "loss": 1.4331, "step": 23326 }, { "epoch": 0.64, "learning_rate": 6.149276051268783e-06, "loss": 1.1782, "step": 23327 }, { "epoch": 0.64, "learning_rate": 6.148459766699548e-06, "loss": 1.2075, "step": 23328 }, { "epoch": 0.64, "learning_rate": 6.147643512262953e-06, "loss": 1.248, "step": 23329 }, { "epoch": 0.64, "learning_rate": 6.146827287965383e-06, "loss": 1.5605, "step": 23330 }, { "epoch": 0.64, "learning_rate": 6.146011093813223e-06, "loss": 1.2566, "step": 23331 }, { "epoch": 0.64, "learning_rate": 6.145194929812863e-06, "loss": 1.2478, "step": 23332 }, { "epoch": 0.64, "learning_rate": 6.144378795970682e-06, "loss": 1.3325, "step": 23333 }, { "epoch": 0.64, "learning_rate": 6.1435626922930706e-06, "loss": 1.2354, "step": 23334 }, { "epoch": 0.64, "learning_rate": 6.142746618786409e-06, "loss": 1.1794, "step": 23335 }, { "epoch": 0.64, "learning_rate": 6.141930575457087e-06, "loss": 1.2666, "step": 23336 }, { "epoch": 0.64, "learning_rate": 6.141114562311483e-06, "loss": 1.4209, "step": 23337 }, { "epoch": 0.64, "learning_rate": 6.1402985793559854e-06, "loss": 1.3301, "step": 23338 }, { "epoch": 0.64, "learning_rate": 6.139482626596977e-06, "loss": 1.0643, "step": 23339 }, { "epoch": 0.64, "learning_rate": 6.138666704040841e-06, "loss": 1.2227, "step": 23340 }, { "epoch": 0.64, "learning_rate": 6.13785081169396e-06, "loss": 0.976, "step": 23341 }, { "epoch": 0.64, "learning_rate": 6.137034949562719e-06, "loss": 1.052, "step": 23342 }, { "epoch": 0.64, "learning_rate": 6.136219117653502e-06, "loss": 1.2646, "step": 23343 }, { "epoch": 0.64, "learning_rate": 6.135403315972685e-06, "loss": 1.2661, "step": 23344 }, { "epoch": 0.64, "learning_rate": 6.13458754452666e-06, "loss": 1.3848, "step": 23345 }, { "epoch": 0.64, "learning_rate": 6.133771803321802e-06, "loss": 1.3174, "step": 23346 }, { "epoch": 0.64, "learning_rate": 6.132956092364497e-06, "loss": 1.2778, "step": 23347 }, { "epoch": 0.64, "learning_rate": 6.132140411661123e-06, "loss": 1.3657, "step": 23348 }, { "epoch": 0.64, "learning_rate": 6.131324761218065e-06, "loss": 1.7617, "step": 23349 }, { "epoch": 0.64, "learning_rate": 6.130509141041702e-06, "loss": 1.2515, "step": 23350 }, { "epoch": 0.64, "learning_rate": 6.129693551138417e-06, "loss": 1.2, "step": 23351 }, { "epoch": 0.64, "learning_rate": 6.128877991514588e-06, "loss": 1.2129, "step": 23352 }, { "epoch": 0.64, "learning_rate": 6.128062462176599e-06, "loss": 1.3042, "step": 23353 }, { "epoch": 0.64, "learning_rate": 6.127246963130827e-06, "loss": 1.3337, "step": 23354 }, { "epoch": 0.64, "learning_rate": 6.1264314943836555e-06, "loss": 1.4194, "step": 23355 }, { "epoch": 0.64, "learning_rate": 6.125616055941462e-06, "loss": 1.3081, "step": 23356 }, { "epoch": 0.64, "learning_rate": 6.124800647810623e-06, "loss": 1.2827, "step": 23357 }, { "epoch": 0.64, "learning_rate": 6.123985269997528e-06, "loss": 1.3352, "step": 23358 }, { "epoch": 0.64, "learning_rate": 6.1231699225085425e-06, "loss": 1.2749, "step": 23359 }, { "epoch": 0.64, "learning_rate": 6.1223546053500605e-06, "loss": 1.2864, "step": 23360 }, { "epoch": 0.64, "learning_rate": 6.121539318528445e-06, "loss": 1.2571, "step": 23361 }, { "epoch": 0.64, "learning_rate": 6.120724062050088e-06, "loss": 1.3899, "step": 23362 }, { "epoch": 0.64, "learning_rate": 6.119908835921356e-06, "loss": 1.3445, "step": 23363 }, { "epoch": 0.64, "learning_rate": 6.11909364014864e-06, "loss": 1.3232, "step": 23364 }, { "epoch": 0.64, "learning_rate": 6.1182784747383036e-06, "loss": 1.2656, "step": 23365 }, { "epoch": 0.64, "learning_rate": 6.117463339696737e-06, "loss": 1.2432, "step": 23366 }, { "epoch": 0.64, "learning_rate": 6.116648235030306e-06, "loss": 1.3435, "step": 23367 }, { "epoch": 0.64, "learning_rate": 6.115833160745399e-06, "loss": 1.1831, "step": 23368 }, { "epoch": 0.64, "learning_rate": 6.1150181168483805e-06, "loss": 1.2695, "step": 23369 }, { "epoch": 0.64, "learning_rate": 6.114203103345639e-06, "loss": 1.3713, "step": 23370 }, { "epoch": 0.64, "learning_rate": 6.11338812024354e-06, "loss": 1.2463, "step": 23371 }, { "epoch": 0.64, "learning_rate": 6.112573167548466e-06, "loss": 1.2324, "step": 23372 }, { "epoch": 0.64, "learning_rate": 6.111758245266795e-06, "loss": 1.3281, "step": 23373 }, { "epoch": 0.64, "learning_rate": 6.110943353404895e-06, "loss": 1.2041, "step": 23374 }, { "epoch": 0.64, "learning_rate": 6.110128491969149e-06, "loss": 1.3657, "step": 23375 }, { "epoch": 0.64, "learning_rate": 6.109313660965925e-06, "loss": 1.2705, "step": 23376 }, { "epoch": 0.64, "learning_rate": 6.108498860401606e-06, "loss": 1.1946, "step": 23377 }, { "epoch": 0.64, "learning_rate": 6.107684090282557e-06, "loss": 1.3511, "step": 23378 }, { "epoch": 0.64, "learning_rate": 6.106869350615161e-06, "loss": 1.0885, "step": 23379 }, { "epoch": 0.64, "learning_rate": 6.106054641405787e-06, "loss": 1.1853, "step": 23380 }, { "epoch": 0.64, "learning_rate": 6.105239962660811e-06, "loss": 1.3452, "step": 23381 }, { "epoch": 0.64, "learning_rate": 6.104425314386606e-06, "loss": 1.3206, "step": 23382 }, { "epoch": 0.64, "learning_rate": 6.103610696589546e-06, "loss": 1.2942, "step": 23383 }, { "epoch": 0.64, "learning_rate": 6.102796109276003e-06, "loss": 1.3137, "step": 23384 }, { "epoch": 0.64, "learning_rate": 6.101981552452352e-06, "loss": 1.335, "step": 23385 }, { "epoch": 0.64, "learning_rate": 6.101167026124961e-06, "loss": 1.2668, "step": 23386 }, { "epoch": 0.64, "learning_rate": 6.100352530300207e-06, "loss": 1.3223, "step": 23387 }, { "epoch": 0.64, "learning_rate": 6.099538064984463e-06, "loss": 1.3708, "step": 23388 }, { "epoch": 0.64, "learning_rate": 6.098723630184098e-06, "loss": 1.3162, "step": 23389 }, { "epoch": 0.64, "learning_rate": 6.097909225905485e-06, "loss": 1.2437, "step": 23390 }, { "epoch": 0.64, "learning_rate": 6.097094852154994e-06, "loss": 1.4602, "step": 23391 }, { "epoch": 0.64, "learning_rate": 6.096280508939e-06, "loss": 1.281, "step": 23392 }, { "epoch": 0.64, "learning_rate": 6.0954661962638695e-06, "loss": 1.313, "step": 23393 }, { "epoch": 0.64, "learning_rate": 6.094651914135977e-06, "loss": 1.1914, "step": 23394 }, { "epoch": 0.64, "learning_rate": 6.09383766256169e-06, "loss": 1.2365, "step": 23395 }, { "epoch": 0.64, "learning_rate": 6.093023441547383e-06, "loss": 1.3613, "step": 23396 }, { "epoch": 0.64, "learning_rate": 6.09220925109942e-06, "loss": 1.4502, "step": 23397 }, { "epoch": 0.64, "learning_rate": 6.091395091224177e-06, "loss": 1.0732, "step": 23398 }, { "epoch": 0.64, "learning_rate": 6.090580961928019e-06, "loss": 1.3218, "step": 23399 }, { "epoch": 0.64, "learning_rate": 6.089766863217319e-06, "loss": 1.4216, "step": 23400 }, { "epoch": 0.64, "learning_rate": 6.088952795098442e-06, "loss": 1.2979, "step": 23401 }, { "epoch": 0.64, "learning_rate": 6.088138757577762e-06, "loss": 1.199, "step": 23402 }, { "epoch": 0.64, "learning_rate": 6.0873247506616415e-06, "loss": 1.2009, "step": 23403 }, { "epoch": 0.64, "learning_rate": 6.086510774356451e-06, "loss": 1.3799, "step": 23404 }, { "epoch": 0.64, "learning_rate": 6.085696828668566e-06, "loss": 1.2759, "step": 23405 }, { "epoch": 0.64, "learning_rate": 6.084882913604342e-06, "loss": 1.3677, "step": 23406 }, { "epoch": 0.64, "learning_rate": 6.0840690291701606e-06, "loss": 1.3782, "step": 23407 }, { "epoch": 0.64, "learning_rate": 6.083255175372373e-06, "loss": 1.2866, "step": 23408 }, { "epoch": 0.64, "learning_rate": 6.082441352217364e-06, "loss": 1.3721, "step": 23409 }, { "epoch": 0.64, "learning_rate": 6.081627559711485e-06, "loss": 1.3406, "step": 23410 }, { "epoch": 0.64, "learning_rate": 6.0808137978611134e-06, "loss": 1.251, "step": 23411 }, { "epoch": 0.64, "learning_rate": 6.080000066672608e-06, "loss": 1.2681, "step": 23412 }, { "epoch": 0.64, "learning_rate": 6.079186366152344e-06, "loss": 1.3823, "step": 23413 }, { "epoch": 0.64, "learning_rate": 6.078372696306676e-06, "loss": 1.3457, "step": 23414 }, { "epoch": 0.64, "learning_rate": 6.0775590571419814e-06, "loss": 1.332, "step": 23415 }, { "epoch": 0.64, "learning_rate": 6.076745448664616e-06, "loss": 1.4214, "step": 23416 }, { "epoch": 0.64, "learning_rate": 6.0759318708809536e-06, "loss": 1.3481, "step": 23417 }, { "epoch": 0.64, "learning_rate": 6.075118323797351e-06, "loss": 1.2551, "step": 23418 }, { "epoch": 0.64, "learning_rate": 6.074304807420177e-06, "loss": 1.425, "step": 23419 }, { "epoch": 0.64, "learning_rate": 6.073491321755799e-06, "loss": 1.3052, "step": 23420 }, { "epoch": 0.64, "learning_rate": 6.072677866810577e-06, "loss": 1.176, "step": 23421 }, { "epoch": 0.64, "learning_rate": 6.071864442590878e-06, "loss": 1.3442, "step": 23422 }, { "epoch": 0.64, "learning_rate": 6.071051049103063e-06, "loss": 1.1794, "step": 23423 }, { "epoch": 0.64, "learning_rate": 6.070237686353497e-06, "loss": 1.2383, "step": 23424 }, { "epoch": 0.64, "learning_rate": 6.069424354348543e-06, "loss": 1.3628, "step": 23425 }, { "epoch": 0.64, "learning_rate": 6.068611053094568e-06, "loss": 1.314, "step": 23426 }, { "epoch": 0.64, "learning_rate": 6.067797782597928e-06, "loss": 1.3359, "step": 23427 }, { "epoch": 0.64, "learning_rate": 6.066984542864991e-06, "loss": 1.2068, "step": 23428 }, { "epoch": 0.64, "learning_rate": 6.066171333902115e-06, "loss": 1.2332, "step": 23429 }, { "epoch": 0.64, "learning_rate": 6.065358155715668e-06, "loss": 1.2688, "step": 23430 }, { "epoch": 0.64, "learning_rate": 6.064545008312006e-06, "loss": 1.2366, "step": 23431 }, { "epoch": 0.64, "learning_rate": 6.063731891697495e-06, "loss": 1.2947, "step": 23432 }, { "epoch": 0.64, "learning_rate": 6.062918805878493e-06, "loss": 1.3506, "step": 23433 }, { "epoch": 0.64, "learning_rate": 6.062105750861362e-06, "loss": 1.2156, "step": 23434 }, { "epoch": 0.64, "learning_rate": 6.061292726652468e-06, "loss": 1.2742, "step": 23435 }, { "epoch": 0.64, "learning_rate": 6.0604797332581645e-06, "loss": 1.1538, "step": 23436 }, { "epoch": 0.64, "learning_rate": 6.059666770684815e-06, "loss": 1.3604, "step": 23437 }, { "epoch": 0.64, "learning_rate": 6.05885383893878e-06, "loss": 1.2161, "step": 23438 }, { "epoch": 0.64, "learning_rate": 6.058040938026422e-06, "loss": 1.1792, "step": 23439 }, { "epoch": 0.64, "learning_rate": 6.057228067954095e-06, "loss": 1.1755, "step": 23440 }, { "epoch": 0.64, "learning_rate": 6.056415228728163e-06, "loss": 1.2832, "step": 23441 }, { "epoch": 0.64, "learning_rate": 6.055602420354982e-06, "loss": 1.3096, "step": 23442 }, { "epoch": 0.64, "learning_rate": 6.054789642840917e-06, "loss": 1.2937, "step": 23443 }, { "epoch": 0.64, "learning_rate": 6.053976896192319e-06, "loss": 1.3669, "step": 23444 }, { "epoch": 0.64, "learning_rate": 6.053164180415552e-06, "loss": 1.1963, "step": 23445 }, { "epoch": 0.64, "learning_rate": 6.05235149551697e-06, "loss": 1.1797, "step": 23446 }, { "epoch": 0.64, "learning_rate": 6.051538841502938e-06, "loss": 1.3518, "step": 23447 }, { "epoch": 0.64, "learning_rate": 6.050726218379804e-06, "loss": 1.1306, "step": 23448 }, { "epoch": 0.64, "learning_rate": 6.049913626153932e-06, "loss": 1.2639, "step": 23449 }, { "epoch": 0.64, "learning_rate": 6.049101064831682e-06, "loss": 1.25, "step": 23450 }, { "epoch": 0.64, "learning_rate": 6.048288534419403e-06, "loss": 1.2208, "step": 23451 }, { "epoch": 0.64, "learning_rate": 6.047476034923462e-06, "loss": 1.2656, "step": 23452 }, { "epoch": 0.64, "learning_rate": 6.0466635663502035e-06, "loss": 1.2861, "step": 23453 }, { "epoch": 0.64, "learning_rate": 6.045851128705997e-06, "loss": 1.3198, "step": 23454 }, { "epoch": 0.64, "learning_rate": 6.0450387219971855e-06, "loss": 1.345, "step": 23455 }, { "epoch": 0.64, "learning_rate": 6.0442263462301365e-06, "loss": 1.2253, "step": 23456 }, { "epoch": 0.64, "learning_rate": 6.0434140014111946e-06, "loss": 1.3809, "step": 23457 }, { "epoch": 0.64, "learning_rate": 6.042601687546728e-06, "loss": 1.687, "step": 23458 }, { "epoch": 0.64, "learning_rate": 6.041789404643078e-06, "loss": 1.3472, "step": 23459 }, { "epoch": 0.64, "learning_rate": 6.040977152706613e-06, "loss": 1.6099, "step": 23460 }, { "epoch": 0.64, "learning_rate": 6.040164931743675e-06, "loss": 1.2844, "step": 23461 }, { "epoch": 0.64, "learning_rate": 6.03935274176063e-06, "loss": 1.1248, "step": 23462 }, { "epoch": 0.64, "learning_rate": 6.038540582763821e-06, "loss": 1.2644, "step": 23463 }, { "epoch": 0.64, "learning_rate": 6.037728454759612e-06, "loss": 1.1536, "step": 23464 }, { "epoch": 0.64, "learning_rate": 6.03691635775435e-06, "loss": 1.3413, "step": 23465 }, { "epoch": 0.64, "learning_rate": 6.036104291754392e-06, "loss": 1.3413, "step": 23466 }, { "epoch": 0.64, "learning_rate": 6.03529225676609e-06, "loss": 1.3779, "step": 23467 }, { "epoch": 0.64, "learning_rate": 6.034480252795797e-06, "loss": 1.2656, "step": 23468 }, { "epoch": 0.64, "learning_rate": 6.033668279849867e-06, "loss": 1.2332, "step": 23469 }, { "epoch": 0.64, "learning_rate": 6.03285633793465e-06, "loss": 1.2737, "step": 23470 }, { "epoch": 0.64, "learning_rate": 6.0320444270565e-06, "loss": 1.498, "step": 23471 }, { "epoch": 0.64, "learning_rate": 6.031232547221767e-06, "loss": 1.1614, "step": 23472 }, { "epoch": 0.64, "learning_rate": 6.0304206984368075e-06, "loss": 1.0745, "step": 23473 }, { "epoch": 0.64, "learning_rate": 6.029608880707967e-06, "loss": 1.2549, "step": 23474 }, { "epoch": 0.64, "learning_rate": 6.028797094041601e-06, "loss": 1.2385, "step": 23475 }, { "epoch": 0.64, "learning_rate": 6.0279853384440575e-06, "loss": 1.2563, "step": 23476 }, { "epoch": 0.64, "learning_rate": 6.027173613921691e-06, "loss": 1.3745, "step": 23477 }, { "epoch": 0.64, "learning_rate": 6.0263619204808474e-06, "loss": 1.3057, "step": 23478 }, { "epoch": 0.64, "learning_rate": 6.0255502581278835e-06, "loss": 1.1704, "step": 23479 }, { "epoch": 0.64, "learning_rate": 6.0247386268691424e-06, "loss": 1.2573, "step": 23480 }, { "epoch": 0.64, "learning_rate": 6.023927026710976e-06, "loss": 1.2891, "step": 23481 }, { "epoch": 0.64, "learning_rate": 6.023115457659738e-06, "loss": 1.3228, "step": 23482 }, { "epoch": 0.64, "learning_rate": 6.022303919721772e-06, "loss": 1.0398, "step": 23483 }, { "epoch": 0.64, "learning_rate": 6.0214924129034325e-06, "loss": 1.3008, "step": 23484 }, { "epoch": 0.64, "learning_rate": 6.020680937211063e-06, "loss": 1.2212, "step": 23485 }, { "epoch": 0.64, "learning_rate": 6.019869492651016e-06, "loss": 1.2891, "step": 23486 }, { "epoch": 0.64, "learning_rate": 6.019058079229638e-06, "loss": 1.4392, "step": 23487 }, { "epoch": 0.64, "learning_rate": 6.018246696953278e-06, "loss": 1.7402, "step": 23488 }, { "epoch": 0.64, "learning_rate": 6.017435345828282e-06, "loss": 1.1885, "step": 23489 }, { "epoch": 0.64, "learning_rate": 6.016624025861002e-06, "loss": 1.3582, "step": 23490 }, { "epoch": 0.64, "learning_rate": 6.01581273705778e-06, "loss": 1.2229, "step": 23491 }, { "epoch": 0.64, "learning_rate": 6.015001479424967e-06, "loss": 1.4089, "step": 23492 }, { "epoch": 0.64, "learning_rate": 6.014190252968908e-06, "loss": 1.3506, "step": 23493 }, { "epoch": 0.64, "learning_rate": 6.0133790576959515e-06, "loss": 1.2864, "step": 23494 }, { "epoch": 0.64, "learning_rate": 6.01256789361244e-06, "loss": 1.353, "step": 23495 }, { "epoch": 0.64, "learning_rate": 6.011756760724721e-06, "loss": 1.0543, "step": 23496 }, { "epoch": 0.64, "learning_rate": 6.010945659039145e-06, "loss": 1.2976, "step": 23497 }, { "epoch": 0.64, "learning_rate": 6.010134588562053e-06, "loss": 1.2642, "step": 23498 }, { "epoch": 0.64, "learning_rate": 6.009323549299793e-06, "loss": 1.2319, "step": 23499 }, { "epoch": 0.64, "learning_rate": 6.008512541258708e-06, "loss": 1.415, "step": 23500 }, { "epoch": 0.64, "learning_rate": 6.007701564445145e-06, "loss": 1.354, "step": 23501 }, { "epoch": 0.64, "learning_rate": 6.006890618865446e-06, "loss": 1.366, "step": 23502 }, { "epoch": 0.64, "learning_rate": 6.00607970452596e-06, "loss": 1.0803, "step": 23503 }, { "epoch": 0.64, "learning_rate": 6.0052688214330255e-06, "loss": 1.355, "step": 23504 }, { "epoch": 0.64, "learning_rate": 6.004457969592992e-06, "loss": 1.3196, "step": 23505 }, { "epoch": 0.64, "learning_rate": 6.0036471490121975e-06, "loss": 1.3208, "step": 23506 }, { "epoch": 0.64, "learning_rate": 6.002836359696991e-06, "loss": 1.3159, "step": 23507 }, { "epoch": 0.64, "learning_rate": 6.0020256016537115e-06, "loss": 1.7578, "step": 23508 }, { "epoch": 0.64, "learning_rate": 6.001214874888704e-06, "loss": 1.3069, "step": 23509 }, { "epoch": 0.64, "learning_rate": 6.000404179408312e-06, "loss": 1.3254, "step": 23510 }, { "epoch": 0.64, "learning_rate": 5.9995935152188754e-06, "loss": 1.0959, "step": 23511 }, { "epoch": 0.64, "learning_rate": 5.998782882326739e-06, "loss": 1.082, "step": 23512 }, { "epoch": 0.64, "learning_rate": 5.997972280738242e-06, "loss": 1.1946, "step": 23513 }, { "epoch": 0.64, "learning_rate": 5.9971617104597315e-06, "loss": 1.3623, "step": 23514 }, { "epoch": 0.64, "learning_rate": 5.996351171497543e-06, "loss": 1.3157, "step": 23515 }, { "epoch": 0.64, "learning_rate": 5.995540663858022e-06, "loss": 1.2634, "step": 23516 }, { "epoch": 0.64, "learning_rate": 5.994730187547505e-06, "loss": 1.1543, "step": 23517 }, { "epoch": 0.64, "learning_rate": 5.993919742572339e-06, "loss": 1.3447, "step": 23518 }, { "epoch": 0.64, "learning_rate": 5.9931093289388575e-06, "loss": 1.1262, "step": 23519 }, { "epoch": 0.64, "learning_rate": 5.9922989466534076e-06, "loss": 1.3423, "step": 23520 }, { "epoch": 0.64, "learning_rate": 5.991488595722325e-06, "loss": 1.2976, "step": 23521 }, { "epoch": 0.64, "learning_rate": 5.990678276151951e-06, "loss": 1.2988, "step": 23522 }, { "epoch": 0.64, "learning_rate": 5.989867987948624e-06, "loss": 1.3601, "step": 23523 }, { "epoch": 0.64, "learning_rate": 5.989057731118686e-06, "loss": 1.3093, "step": 23524 }, { "epoch": 0.64, "learning_rate": 5.988247505668472e-06, "loss": 1.3306, "step": 23525 }, { "epoch": 0.64, "learning_rate": 5.987437311604325e-06, "loss": 1.1758, "step": 23526 }, { "epoch": 0.64, "learning_rate": 5.98662714893258e-06, "loss": 1.3115, "step": 23527 }, { "epoch": 0.64, "learning_rate": 5.985817017659577e-06, "loss": 1.2871, "step": 23528 }, { "epoch": 0.64, "learning_rate": 5.985006917791655e-06, "loss": 1.208, "step": 23529 }, { "epoch": 0.64, "learning_rate": 5.9841968493351465e-06, "loss": 1.2651, "step": 23530 }, { "epoch": 0.64, "learning_rate": 5.983386812296402e-06, "loss": 1.2249, "step": 23531 }, { "epoch": 0.64, "learning_rate": 5.982576806681742e-06, "loss": 1.3091, "step": 23532 }, { "epoch": 0.64, "learning_rate": 5.98176683249752e-06, "loss": 1.2434, "step": 23533 }, { "epoch": 0.64, "learning_rate": 5.980956889750057e-06, "loss": 1.2588, "step": 23534 }, { "epoch": 0.64, "learning_rate": 5.980146978445704e-06, "loss": 1.3223, "step": 23535 }, { "epoch": 0.64, "learning_rate": 5.979337098590785e-06, "loss": 1.0996, "step": 23536 }, { "epoch": 0.64, "learning_rate": 5.978527250191648e-06, "loss": 1.1997, "step": 23537 }, { "epoch": 0.64, "learning_rate": 5.977717433254616e-06, "loss": 1.4216, "step": 23538 }, { "epoch": 0.64, "learning_rate": 5.976907647786039e-06, "loss": 1.2615, "step": 23539 }, { "epoch": 0.64, "learning_rate": 5.976097893792237e-06, "loss": 1.1577, "step": 23540 }, { "epoch": 0.64, "learning_rate": 5.975288171279559e-06, "loss": 1.2075, "step": 23541 }, { "epoch": 0.64, "learning_rate": 5.9744784802543284e-06, "loss": 1.3123, "step": 23542 }, { "epoch": 0.64, "learning_rate": 5.973668820722888e-06, "loss": 1.4014, "step": 23543 }, { "epoch": 0.64, "learning_rate": 5.9728591926915704e-06, "loss": 1.2493, "step": 23544 }, { "epoch": 0.64, "learning_rate": 5.972049596166707e-06, "loss": 1.2213, "step": 23545 }, { "epoch": 0.64, "learning_rate": 5.971240031154635e-06, "loss": 1.0342, "step": 23546 }, { "epoch": 0.64, "learning_rate": 5.970430497661686e-06, "loss": 1.3025, "step": 23547 }, { "epoch": 0.64, "learning_rate": 5.969620995694194e-06, "loss": 1.311, "step": 23548 }, { "epoch": 0.64, "learning_rate": 5.968811525258491e-06, "loss": 1.3459, "step": 23549 }, { "epoch": 0.64, "learning_rate": 5.9680020863609136e-06, "loss": 1.3176, "step": 23550 }, { "epoch": 0.64, "learning_rate": 5.96719267900779e-06, "loss": 1.2864, "step": 23551 }, { "epoch": 0.64, "learning_rate": 5.966383303205455e-06, "loss": 1.2732, "step": 23552 }, { "epoch": 0.64, "learning_rate": 5.9655739589602405e-06, "loss": 1.323, "step": 23553 }, { "epoch": 0.64, "learning_rate": 5.964764646278478e-06, "loss": 1.437, "step": 23554 }, { "epoch": 0.64, "learning_rate": 5.9639553651664985e-06, "loss": 1.1514, "step": 23555 }, { "epoch": 0.64, "learning_rate": 5.963146115630636e-06, "loss": 1.1248, "step": 23556 }, { "epoch": 0.64, "learning_rate": 5.962336897677219e-06, "loss": 1.3066, "step": 23557 }, { "epoch": 0.64, "learning_rate": 5.961527711312578e-06, "loss": 1.1409, "step": 23558 }, { "epoch": 0.64, "learning_rate": 5.960718556543048e-06, "loss": 1.4717, "step": 23559 }, { "epoch": 0.64, "learning_rate": 5.959909433374955e-06, "loss": 1.2075, "step": 23560 }, { "epoch": 0.64, "learning_rate": 5.959100341814632e-06, "loss": 1.3777, "step": 23561 }, { "epoch": 0.64, "learning_rate": 5.9582912818684055e-06, "loss": 1.1182, "step": 23562 }, { "epoch": 0.64, "learning_rate": 5.95748225354261e-06, "loss": 1.4302, "step": 23563 }, { "epoch": 0.64, "learning_rate": 5.956673256843571e-06, "loss": 1.3003, "step": 23564 }, { "epoch": 0.64, "learning_rate": 5.95586429177762e-06, "loss": 1.3665, "step": 23565 }, { "epoch": 0.64, "learning_rate": 5.955055358351084e-06, "loss": 1.2266, "step": 23566 }, { "epoch": 0.64, "learning_rate": 5.954246456570294e-06, "loss": 1.2749, "step": 23567 }, { "epoch": 0.64, "learning_rate": 5.953437586441577e-06, "loss": 1.2683, "step": 23568 }, { "epoch": 0.64, "learning_rate": 5.952628747971262e-06, "loss": 1.2668, "step": 23569 }, { "epoch": 0.64, "learning_rate": 5.951819941165675e-06, "loss": 1.3293, "step": 23570 }, { "epoch": 0.64, "learning_rate": 5.951011166031147e-06, "loss": 1.2839, "step": 23571 }, { "epoch": 0.64, "learning_rate": 5.950202422574001e-06, "loss": 1.207, "step": 23572 }, { "epoch": 0.64, "learning_rate": 5.949393710800569e-06, "loss": 1.2251, "step": 23573 }, { "epoch": 0.64, "learning_rate": 5.948585030717175e-06, "loss": 1.1736, "step": 23574 }, { "epoch": 0.64, "learning_rate": 5.947776382330144e-06, "loss": 1.3657, "step": 23575 }, { "epoch": 0.64, "learning_rate": 5.94696776564581e-06, "loss": 1.2627, "step": 23576 }, { "epoch": 0.64, "learning_rate": 5.94615918067049e-06, "loss": 1.4426, "step": 23577 }, { "epoch": 0.64, "learning_rate": 5.94535062741052e-06, "loss": 1.177, "step": 23578 }, { "epoch": 0.64, "learning_rate": 5.944542105872213e-06, "loss": 1.302, "step": 23579 }, { "epoch": 0.64, "learning_rate": 5.943733616061908e-06, "loss": 1.2351, "step": 23580 }, { "epoch": 0.64, "learning_rate": 5.942925157985919e-06, "loss": 1.3296, "step": 23581 }, { "epoch": 0.64, "learning_rate": 5.9421167316505815e-06, "loss": 1.2136, "step": 23582 }, { "epoch": 0.64, "learning_rate": 5.941308337062208e-06, "loss": 1.262, "step": 23583 }, { "epoch": 0.64, "learning_rate": 5.9404999742271355e-06, "loss": 1.1633, "step": 23584 }, { "epoch": 0.64, "learning_rate": 5.939691643151676e-06, "loss": 1.2935, "step": 23585 }, { "epoch": 0.64, "learning_rate": 5.938883343842165e-06, "loss": 1.27, "step": 23586 }, { "epoch": 0.64, "learning_rate": 5.938075076304916e-06, "loss": 1.2218, "step": 23587 }, { "epoch": 0.64, "learning_rate": 5.937266840546265e-06, "loss": 1.415, "step": 23588 }, { "epoch": 0.64, "learning_rate": 5.93645863657252e-06, "loss": 1.5371, "step": 23589 }, { "epoch": 0.64, "learning_rate": 5.935650464390015e-06, "loss": 1.0837, "step": 23590 }, { "epoch": 0.64, "learning_rate": 5.9348423240050705e-06, "loss": 1.2905, "step": 23591 }, { "epoch": 0.64, "learning_rate": 5.934034215424007e-06, "loss": 1.188, "step": 23592 }, { "epoch": 0.64, "learning_rate": 5.93322613865315e-06, "loss": 1.1, "step": 23593 }, { "epoch": 0.64, "learning_rate": 5.932418093698815e-06, "loss": 1.1543, "step": 23594 }, { "epoch": 0.64, "learning_rate": 5.931610080567333e-06, "loss": 1.1755, "step": 23595 }, { "epoch": 0.64, "learning_rate": 5.930802099265016e-06, "loss": 1.2656, "step": 23596 }, { "epoch": 0.64, "learning_rate": 5.929994149798195e-06, "loss": 1.2939, "step": 23597 }, { "epoch": 0.64, "learning_rate": 5.929186232173181e-06, "loss": 1.262, "step": 23598 }, { "epoch": 0.64, "learning_rate": 5.928378346396304e-06, "loss": 1.3472, "step": 23599 }, { "epoch": 0.64, "learning_rate": 5.9275704924738776e-06, "loss": 1.877, "step": 23600 }, { "epoch": 0.64, "learning_rate": 5.926762670412225e-06, "loss": 1.3657, "step": 23601 }, { "epoch": 0.64, "learning_rate": 5.925954880217666e-06, "loss": 1.2568, "step": 23602 }, { "epoch": 0.64, "learning_rate": 5.92514712189652e-06, "loss": 1.0686, "step": 23603 }, { "epoch": 0.64, "learning_rate": 5.9243393954551075e-06, "loss": 1.2751, "step": 23604 }, { "epoch": 0.64, "learning_rate": 5.923531700899745e-06, "loss": 1.2642, "step": 23605 }, { "epoch": 0.64, "learning_rate": 5.922724038236757e-06, "loss": 1.2429, "step": 23606 }, { "epoch": 0.64, "learning_rate": 5.921916407472456e-06, "loss": 1.2458, "step": 23607 }, { "epoch": 0.64, "learning_rate": 5.921108808613165e-06, "loss": 1.3044, "step": 23608 }, { "epoch": 0.64, "learning_rate": 5.920301241665199e-06, "loss": 1.3643, "step": 23609 }, { "epoch": 0.64, "learning_rate": 5.9194937066348805e-06, "loss": 1.2717, "step": 23610 }, { "epoch": 0.64, "learning_rate": 5.918686203528522e-06, "loss": 1.7139, "step": 23611 }, { "epoch": 0.64, "learning_rate": 5.9178787323524445e-06, "loss": 1.3696, "step": 23612 }, { "epoch": 0.64, "learning_rate": 5.917071293112963e-06, "loss": 1.4092, "step": 23613 }, { "epoch": 0.64, "learning_rate": 5.916263885816398e-06, "loss": 1.2004, "step": 23614 }, { "epoch": 0.64, "learning_rate": 5.915456510469062e-06, "loss": 1.1785, "step": 23615 }, { "epoch": 0.64, "learning_rate": 5.914649167077275e-06, "loss": 1.291, "step": 23616 }, { "epoch": 0.64, "learning_rate": 5.913841855647351e-06, "loss": 1.1543, "step": 23617 }, { "epoch": 0.64, "learning_rate": 5.913034576185608e-06, "loss": 1.2085, "step": 23618 }, { "epoch": 0.65, "learning_rate": 5.912227328698359e-06, "loss": 1.2546, "step": 23619 }, { "epoch": 0.65, "learning_rate": 5.911420113191919e-06, "loss": 1.2278, "step": 23620 }, { "epoch": 0.65, "learning_rate": 5.910612929672612e-06, "loss": 1.2739, "step": 23621 }, { "epoch": 0.65, "learning_rate": 5.90980577814674e-06, "loss": 1.3303, "step": 23622 }, { "epoch": 0.65, "learning_rate": 5.908998658620631e-06, "loss": 1.2852, "step": 23623 }, { "epoch": 0.65, "learning_rate": 5.908191571100586e-06, "loss": 1.3181, "step": 23624 }, { "epoch": 0.65, "learning_rate": 5.907384515592931e-06, "loss": 1.2148, "step": 23625 }, { "epoch": 0.65, "learning_rate": 5.9065774921039695e-06, "loss": 1.2222, "step": 23626 }, { "epoch": 0.65, "learning_rate": 5.905770500640028e-06, "loss": 1.2458, "step": 23627 }, { "epoch": 0.65, "learning_rate": 5.904963541207407e-06, "loss": 1.2322, "step": 23628 }, { "epoch": 0.65, "learning_rate": 5.904156613812431e-06, "loss": 1.2747, "step": 23629 }, { "epoch": 0.65, "learning_rate": 5.903349718461401e-06, "loss": 1.2856, "step": 23630 }, { "epoch": 0.65, "learning_rate": 5.902542855160642e-06, "loss": 1.0796, "step": 23631 }, { "epoch": 0.65, "learning_rate": 5.901736023916457e-06, "loss": 1.3657, "step": 23632 }, { "epoch": 0.65, "learning_rate": 5.900929224735167e-06, "loss": 1.0676, "step": 23633 }, { "epoch": 0.65, "learning_rate": 5.900122457623073e-06, "loss": 1.345, "step": 23634 }, { "epoch": 0.65, "learning_rate": 5.8993157225865e-06, "loss": 1.3174, "step": 23635 }, { "epoch": 0.65, "learning_rate": 5.898509019631745e-06, "loss": 1.2747, "step": 23636 }, { "epoch": 0.65, "learning_rate": 5.89770234876513e-06, "loss": 1.312, "step": 23637 }, { "epoch": 0.65, "learning_rate": 5.896895709992965e-06, "loss": 1.2869, "step": 23638 }, { "epoch": 0.65, "learning_rate": 5.896089103321555e-06, "loss": 1.3079, "step": 23639 }, { "epoch": 0.65, "learning_rate": 5.895282528757218e-06, "loss": 1.1819, "step": 23640 }, { "epoch": 0.65, "learning_rate": 5.894475986306256e-06, "loss": 1.2783, "step": 23641 }, { "epoch": 0.65, "learning_rate": 5.893669475974988e-06, "loss": 1.1067, "step": 23642 }, { "epoch": 0.65, "learning_rate": 5.892862997769715e-06, "loss": 1.2188, "step": 23643 }, { "epoch": 0.65, "learning_rate": 5.892056551696754e-06, "loss": 1.2173, "step": 23644 }, { "epoch": 0.65, "learning_rate": 5.891250137762407e-06, "loss": 1.1636, "step": 23645 }, { "epoch": 0.65, "learning_rate": 5.890443755972991e-06, "loss": 1.2559, "step": 23646 }, { "epoch": 0.65, "learning_rate": 5.889637406334807e-06, "loss": 1.2791, "step": 23647 }, { "epoch": 0.65, "learning_rate": 5.88883108885417e-06, "loss": 1.5649, "step": 23648 }, { "epoch": 0.65, "learning_rate": 5.888024803537384e-06, "loss": 1.2688, "step": 23649 }, { "epoch": 0.65, "learning_rate": 5.887218550390758e-06, "loss": 1.0808, "step": 23650 }, { "epoch": 0.65, "learning_rate": 5.886412329420601e-06, "loss": 1.4209, "step": 23651 }, { "epoch": 0.65, "learning_rate": 5.885606140633218e-06, "loss": 1.2703, "step": 23652 }, { "epoch": 0.65, "learning_rate": 5.884799984034919e-06, "loss": 1.2, "step": 23653 }, { "epoch": 0.65, "learning_rate": 5.883993859632009e-06, "loss": 1.1438, "step": 23654 }, { "epoch": 0.65, "learning_rate": 5.883187767430798e-06, "loss": 1.2603, "step": 23655 }, { "epoch": 0.65, "learning_rate": 5.882381707437588e-06, "loss": 1.244, "step": 23656 }, { "epoch": 0.65, "learning_rate": 5.8815756796586885e-06, "loss": 1.3215, "step": 23657 }, { "epoch": 0.65, "learning_rate": 5.8807696841004024e-06, "loss": 1.1804, "step": 23658 }, { "epoch": 0.65, "learning_rate": 5.879963720769038e-06, "loss": 1.2998, "step": 23659 }, { "epoch": 0.65, "learning_rate": 5.8791577896709e-06, "loss": 1.3308, "step": 23660 }, { "epoch": 0.65, "learning_rate": 5.878351890812295e-06, "loss": 1.1519, "step": 23661 }, { "epoch": 0.65, "learning_rate": 5.8775460241995255e-06, "loss": 1.2218, "step": 23662 }, { "epoch": 0.65, "learning_rate": 5.876740189838899e-06, "loss": 1.1584, "step": 23663 }, { "epoch": 0.65, "learning_rate": 5.875934387736715e-06, "loss": 1.3301, "step": 23664 }, { "epoch": 0.65, "learning_rate": 5.875128617899284e-06, "loss": 1.29, "step": 23665 }, { "epoch": 0.65, "learning_rate": 5.874322880332906e-06, "loss": 1.3621, "step": 23666 }, { "epoch": 0.65, "learning_rate": 5.873517175043882e-06, "loss": 1.1763, "step": 23667 }, { "epoch": 0.65, "learning_rate": 5.872711502038526e-06, "loss": 1.1733, "step": 23668 }, { "epoch": 0.65, "learning_rate": 5.871905861323129e-06, "loss": 1.4277, "step": 23669 }, { "epoch": 0.65, "learning_rate": 5.871100252904005e-06, "loss": 1.3914, "step": 23670 }, { "epoch": 0.65, "learning_rate": 5.870294676787444e-06, "loss": 1.3467, "step": 23671 }, { "epoch": 0.65, "learning_rate": 5.869489132979764e-06, "loss": 1.2722, "step": 23672 }, { "epoch": 0.65, "learning_rate": 5.8686836214872515e-06, "loss": 1.2524, "step": 23673 }, { "epoch": 0.65, "learning_rate": 5.867878142316221e-06, "loss": 1.3696, "step": 23674 }, { "epoch": 0.65, "learning_rate": 5.8670726954729636e-06, "loss": 1.2756, "step": 23675 }, { "epoch": 0.65, "learning_rate": 5.866267280963791e-06, "loss": 1.2698, "step": 23676 }, { "epoch": 0.65, "learning_rate": 5.865461898794995e-06, "loss": 1.4021, "step": 23677 }, { "epoch": 0.65, "learning_rate": 5.8646565489728845e-06, "loss": 1.3235, "step": 23678 }, { "epoch": 0.65, "learning_rate": 5.863851231503752e-06, "loss": 1.2283, "step": 23679 }, { "epoch": 0.65, "learning_rate": 5.863045946393909e-06, "loss": 1.3228, "step": 23680 }, { "epoch": 0.65, "learning_rate": 5.8622406936496434e-06, "loss": 1.2446, "step": 23681 }, { "epoch": 0.65, "learning_rate": 5.8614354732772616e-06, "loss": 1.3088, "step": 23682 }, { "epoch": 0.65, "learning_rate": 5.860630285283066e-06, "loss": 1.2339, "step": 23683 }, { "epoch": 0.65, "learning_rate": 5.859825129673349e-06, "loss": 1.1877, "step": 23684 }, { "epoch": 0.65, "learning_rate": 5.859020006454416e-06, "loss": 1.3557, "step": 23685 }, { "epoch": 0.65, "learning_rate": 5.858214915632562e-06, "loss": 1.4175, "step": 23686 }, { "epoch": 0.65, "learning_rate": 5.857409857214088e-06, "loss": 1.2998, "step": 23687 }, { "epoch": 0.65, "learning_rate": 5.8566048312052905e-06, "loss": 1.3044, "step": 23688 }, { "epoch": 0.65, "learning_rate": 5.855799837612468e-06, "loss": 1.3857, "step": 23689 }, { "epoch": 0.65, "learning_rate": 5.8549948764419194e-06, "loss": 1.458, "step": 23690 }, { "epoch": 0.65, "learning_rate": 5.854189947699942e-06, "loss": 1.353, "step": 23691 }, { "epoch": 0.65, "learning_rate": 5.8533850513928325e-06, "loss": 1.3691, "step": 23692 }, { "epoch": 0.65, "learning_rate": 5.852580187526888e-06, "loss": 1.2478, "step": 23693 }, { "epoch": 0.65, "learning_rate": 5.851775356108407e-06, "loss": 1.3035, "step": 23694 }, { "epoch": 0.65, "learning_rate": 5.850970557143685e-06, "loss": 1.25, "step": 23695 }, { "epoch": 0.65, "learning_rate": 5.850165790639018e-06, "loss": 1.2881, "step": 23696 }, { "epoch": 0.65, "learning_rate": 5.849361056600702e-06, "loss": 1.1699, "step": 23697 }, { "epoch": 0.65, "learning_rate": 5.848556355035034e-06, "loss": 1.3525, "step": 23698 }, { "epoch": 0.65, "learning_rate": 5.847751685948306e-06, "loss": 1.2058, "step": 23699 }, { "epoch": 0.65, "learning_rate": 5.846947049346821e-06, "loss": 1.3306, "step": 23700 }, { "epoch": 0.65, "learning_rate": 5.8461424452368655e-06, "loss": 1.2878, "step": 23701 }, { "epoch": 0.65, "learning_rate": 5.845337873624741e-06, "loss": 1.384, "step": 23702 }, { "epoch": 0.65, "learning_rate": 5.844533334516738e-06, "loss": 1.2109, "step": 23703 }, { "epoch": 0.65, "learning_rate": 5.843728827919153e-06, "loss": 1.2832, "step": 23704 }, { "epoch": 0.65, "learning_rate": 5.842924353838277e-06, "loss": 1.2249, "step": 23705 }, { "epoch": 0.65, "learning_rate": 5.842119912280408e-06, "loss": 1.207, "step": 23706 }, { "epoch": 0.65, "learning_rate": 5.841315503251837e-06, "loss": 1.3882, "step": 23707 }, { "epoch": 0.65, "learning_rate": 5.840511126758859e-06, "loss": 1.3696, "step": 23708 }, { "epoch": 0.65, "learning_rate": 5.839706782807765e-06, "loss": 1.0754, "step": 23709 }, { "epoch": 0.65, "learning_rate": 5.838902471404851e-06, "loss": 1.238, "step": 23710 }, { "epoch": 0.65, "learning_rate": 5.838098192556401e-06, "loss": 1.238, "step": 23711 }, { "epoch": 0.65, "learning_rate": 5.837293946268719e-06, "loss": 0.9624, "step": 23712 }, { "epoch": 0.65, "learning_rate": 5.836489732548092e-06, "loss": 1.083, "step": 23713 }, { "epoch": 0.65, "learning_rate": 5.835685551400807e-06, "loss": 1.3633, "step": 23714 }, { "epoch": 0.65, "learning_rate": 5.834881402833166e-06, "loss": 1.2622, "step": 23715 }, { "epoch": 0.65, "learning_rate": 5.834077286851452e-06, "loss": 1.2532, "step": 23716 }, { "epoch": 0.65, "learning_rate": 5.83327320346196e-06, "loss": 1.2148, "step": 23717 }, { "epoch": 0.65, "learning_rate": 5.832469152670974e-06, "loss": 1.3428, "step": 23718 }, { "epoch": 0.65, "learning_rate": 5.831665134484794e-06, "loss": 1.4033, "step": 23719 }, { "epoch": 0.65, "learning_rate": 5.830861148909705e-06, "loss": 1.3757, "step": 23720 }, { "epoch": 0.65, "learning_rate": 5.830057195951999e-06, "loss": 1.2786, "step": 23721 }, { "epoch": 0.65, "learning_rate": 5.829253275617961e-06, "loss": 1.324, "step": 23722 }, { "epoch": 0.65, "learning_rate": 5.8284493879138855e-06, "loss": 1.2263, "step": 23723 }, { "epoch": 0.65, "learning_rate": 5.827645532846063e-06, "loss": 1.2454, "step": 23724 }, { "epoch": 0.65, "learning_rate": 5.8268417104207795e-06, "loss": 1.269, "step": 23725 }, { "epoch": 0.65, "learning_rate": 5.826037920644321e-06, "loss": 1.3823, "step": 23726 }, { "epoch": 0.65, "learning_rate": 5.825234163522981e-06, "loss": 1.4607, "step": 23727 }, { "epoch": 0.65, "learning_rate": 5.824430439063047e-06, "loss": 1.3452, "step": 23728 }, { "epoch": 0.65, "learning_rate": 5.823626747270801e-06, "loss": 1.2842, "step": 23729 }, { "epoch": 0.65, "learning_rate": 5.822823088152541e-06, "loss": 1.4187, "step": 23730 }, { "epoch": 0.65, "learning_rate": 5.822019461714543e-06, "loss": 1.3833, "step": 23731 }, { "epoch": 0.65, "learning_rate": 5.821215867963109e-06, "loss": 1.4424, "step": 23732 }, { "epoch": 0.65, "learning_rate": 5.820412306904509e-06, "loss": 1.3276, "step": 23733 }, { "epoch": 0.65, "learning_rate": 5.8196087785450424e-06, "loss": 1.2441, "step": 23734 }, { "epoch": 0.65, "learning_rate": 5.818805282890986e-06, "loss": 1.0718, "step": 23735 }, { "epoch": 0.65, "learning_rate": 5.81800181994864e-06, "loss": 1.2012, "step": 23736 }, { "epoch": 0.65, "learning_rate": 5.817198389724272e-06, "loss": 1.2637, "step": 23737 }, { "epoch": 0.65, "learning_rate": 5.816394992224181e-06, "loss": 1.4121, "step": 23738 }, { "epoch": 0.65, "learning_rate": 5.815591627454644e-06, "loss": 1.2195, "step": 23739 }, { "epoch": 0.65, "learning_rate": 5.814788295421961e-06, "loss": 1.333, "step": 23740 }, { "epoch": 0.65, "learning_rate": 5.813984996132395e-06, "loss": 1.2388, "step": 23741 }, { "epoch": 0.65, "learning_rate": 5.813181729592248e-06, "loss": 1.3672, "step": 23742 }, { "epoch": 0.65, "learning_rate": 5.812378495807793e-06, "loss": 1.3591, "step": 23743 }, { "epoch": 0.65, "learning_rate": 5.811575294785326e-06, "loss": 1.2383, "step": 23744 }, { "epoch": 0.65, "learning_rate": 5.810772126531121e-06, "loss": 1.0854, "step": 23745 }, { "epoch": 0.65, "learning_rate": 5.809968991051463e-06, "loss": 1.2271, "step": 23746 }, { "epoch": 0.65, "learning_rate": 5.809165888352641e-06, "loss": 1.3154, "step": 23747 }, { "epoch": 0.65, "learning_rate": 5.8083628184409355e-06, "loss": 1.3594, "step": 23748 }, { "epoch": 0.65, "learning_rate": 5.807559781322627e-06, "loss": 1.208, "step": 23749 }, { "epoch": 0.65, "learning_rate": 5.806756777003995e-06, "loss": 1.3472, "step": 23750 }, { "epoch": 0.65, "learning_rate": 5.805953805491331e-06, "loss": 1.2283, "step": 23751 }, { "epoch": 0.65, "learning_rate": 5.805150866790912e-06, "loss": 1.2019, "step": 23752 }, { "epoch": 0.65, "learning_rate": 5.8043479609090205e-06, "loss": 1.2698, "step": 23753 }, { "epoch": 0.65, "learning_rate": 5.8035450878519315e-06, "loss": 1.4004, "step": 23754 }, { "epoch": 0.65, "learning_rate": 5.802742247625939e-06, "loss": 1.2671, "step": 23755 }, { "epoch": 0.65, "learning_rate": 5.801939440237316e-06, "loss": 1.2185, "step": 23756 }, { "epoch": 0.65, "learning_rate": 5.801136665692346e-06, "loss": 1.27, "step": 23757 }, { "epoch": 0.65, "learning_rate": 5.800333923997303e-06, "loss": 1.3188, "step": 23758 }, { "epoch": 0.65, "learning_rate": 5.7995312151584786e-06, "loss": 1.2747, "step": 23759 }, { "epoch": 0.65, "learning_rate": 5.798728539182144e-06, "loss": 1.2517, "step": 23760 }, { "epoch": 0.65, "learning_rate": 5.797925896074579e-06, "loss": 1.2036, "step": 23761 }, { "epoch": 0.65, "learning_rate": 5.79712328584207e-06, "loss": 1.3516, "step": 23762 }, { "epoch": 0.65, "learning_rate": 5.796320708490892e-06, "loss": 1.2361, "step": 23763 }, { "epoch": 0.65, "learning_rate": 5.795518164027324e-06, "loss": 1.2202, "step": 23764 }, { "epoch": 0.65, "learning_rate": 5.794715652457641e-06, "loss": 1.3367, "step": 23765 }, { "epoch": 0.65, "learning_rate": 5.7939131737881285e-06, "loss": 1.4194, "step": 23766 }, { "epoch": 0.65, "learning_rate": 5.793110728025062e-06, "loss": 1.3347, "step": 23767 }, { "epoch": 0.65, "learning_rate": 5.792308315174719e-06, "loss": 1.1885, "step": 23768 }, { "epoch": 0.65, "learning_rate": 5.791505935243373e-06, "loss": 1.3982, "step": 23769 }, { "epoch": 0.65, "learning_rate": 5.79070358823731e-06, "loss": 1.2952, "step": 23770 }, { "epoch": 0.65, "learning_rate": 5.7899012741628035e-06, "loss": 1.1978, "step": 23771 }, { "epoch": 0.65, "learning_rate": 5.789098993026128e-06, "loss": 1.3521, "step": 23772 }, { "epoch": 0.65, "learning_rate": 5.788296744833559e-06, "loss": 1.3164, "step": 23773 }, { "epoch": 0.65, "learning_rate": 5.78749452959138e-06, "loss": 1.3601, "step": 23774 }, { "epoch": 0.65, "learning_rate": 5.786692347305862e-06, "loss": 1.1263, "step": 23775 }, { "epoch": 0.65, "learning_rate": 5.785890197983277e-06, "loss": 1.1704, "step": 23776 }, { "epoch": 0.65, "learning_rate": 5.7850880816299115e-06, "loss": 1.1882, "step": 23777 }, { "epoch": 0.65, "learning_rate": 5.7842859982520305e-06, "loss": 1.3923, "step": 23778 }, { "epoch": 0.65, "learning_rate": 5.78348394785592e-06, "loss": 1.3352, "step": 23779 }, { "epoch": 0.65, "learning_rate": 5.7826819304478424e-06, "loss": 1.4214, "step": 23780 }, { "epoch": 0.65, "learning_rate": 5.78187994603408e-06, "loss": 1.6931, "step": 23781 }, { "epoch": 0.65, "learning_rate": 5.781077994620903e-06, "loss": 1.1194, "step": 23782 }, { "epoch": 0.65, "learning_rate": 5.7802760762145945e-06, "loss": 1.7144, "step": 23783 }, { "epoch": 0.65, "learning_rate": 5.779474190821416e-06, "loss": 1.3015, "step": 23784 }, { "epoch": 0.65, "learning_rate": 5.778672338447648e-06, "loss": 1.4077, "step": 23785 }, { "epoch": 0.65, "learning_rate": 5.7778705190995625e-06, "loss": 1.1951, "step": 23786 }, { "epoch": 0.65, "learning_rate": 5.7770687327834375e-06, "loss": 1.394, "step": 23787 }, { "epoch": 0.65, "learning_rate": 5.776266979505534e-06, "loss": 1.2017, "step": 23788 }, { "epoch": 0.65, "learning_rate": 5.775465259272135e-06, "loss": 1.2881, "step": 23789 }, { "epoch": 0.65, "learning_rate": 5.774663572089505e-06, "loss": 1.4336, "step": 23790 }, { "epoch": 0.65, "learning_rate": 5.773861917963926e-06, "loss": 1.2583, "step": 23791 }, { "epoch": 0.65, "learning_rate": 5.773060296901662e-06, "loss": 1.2188, "step": 23792 }, { "epoch": 0.65, "learning_rate": 5.7722587089089844e-06, "loss": 1.1204, "step": 23793 }, { "epoch": 0.65, "learning_rate": 5.771457153992169e-06, "loss": 1.3569, "step": 23794 }, { "epoch": 0.65, "learning_rate": 5.770655632157485e-06, "loss": 1.0214, "step": 23795 }, { "epoch": 0.65, "learning_rate": 5.769854143411203e-06, "loss": 1.2178, "step": 23796 }, { "epoch": 0.65, "learning_rate": 5.769052687759589e-06, "loss": 1.4438, "step": 23797 }, { "epoch": 0.65, "learning_rate": 5.7682512652089216e-06, "loss": 1.2078, "step": 23798 }, { "epoch": 0.65, "learning_rate": 5.767449875765465e-06, "loss": 1.3901, "step": 23799 }, { "epoch": 0.65, "learning_rate": 5.766648519435491e-06, "loss": 1.1414, "step": 23800 }, { "epoch": 0.65, "learning_rate": 5.765847196225265e-06, "loss": 1.3533, "step": 23801 }, { "epoch": 0.65, "learning_rate": 5.7650459061410625e-06, "loss": 1.2136, "step": 23802 }, { "epoch": 0.65, "learning_rate": 5.76424464918915e-06, "loss": 1.1907, "step": 23803 }, { "epoch": 0.65, "learning_rate": 5.763443425375796e-06, "loss": 1.2244, "step": 23804 }, { "epoch": 0.65, "learning_rate": 5.762642234707263e-06, "loss": 1.3503, "step": 23805 }, { "epoch": 0.65, "learning_rate": 5.7618410771898305e-06, "loss": 1.0967, "step": 23806 }, { "epoch": 0.65, "learning_rate": 5.761039952829759e-06, "loss": 1.3679, "step": 23807 }, { "epoch": 0.65, "learning_rate": 5.760238861633314e-06, "loss": 1.0471, "step": 23808 }, { "epoch": 0.65, "learning_rate": 5.759437803606771e-06, "loss": 1.3848, "step": 23809 }, { "epoch": 0.65, "learning_rate": 5.758636778756392e-06, "loss": 1.2461, "step": 23810 }, { "epoch": 0.65, "learning_rate": 5.7578357870884434e-06, "loss": 1.1663, "step": 23811 }, { "epoch": 0.65, "learning_rate": 5.757034828609192e-06, "loss": 1.2942, "step": 23812 }, { "epoch": 0.65, "learning_rate": 5.756233903324906e-06, "loss": 1.4087, "step": 23813 }, { "epoch": 0.65, "learning_rate": 5.755433011241851e-06, "loss": 1.3706, "step": 23814 }, { "epoch": 0.65, "learning_rate": 5.754632152366293e-06, "loss": 1.3088, "step": 23815 }, { "epoch": 0.65, "learning_rate": 5.753831326704492e-06, "loss": 1.3247, "step": 23816 }, { "epoch": 0.65, "learning_rate": 5.753030534262722e-06, "loss": 1.2662, "step": 23817 }, { "epoch": 0.65, "learning_rate": 5.752229775047245e-06, "loss": 1.2437, "step": 23818 }, { "epoch": 0.65, "learning_rate": 5.751429049064323e-06, "loss": 1.3416, "step": 23819 }, { "epoch": 0.65, "learning_rate": 5.75062835632022e-06, "loss": 1.2061, "step": 23820 }, { "epoch": 0.65, "learning_rate": 5.749827696821206e-06, "loss": 1.1643, "step": 23821 }, { "epoch": 0.65, "learning_rate": 5.749027070573541e-06, "loss": 1.3108, "step": 23822 }, { "epoch": 0.65, "learning_rate": 5.748226477583485e-06, "loss": 1.3528, "step": 23823 }, { "epoch": 0.65, "learning_rate": 5.747425917857311e-06, "loss": 1.3535, "step": 23824 }, { "epoch": 0.65, "learning_rate": 5.746625391401273e-06, "loss": 1.2795, "step": 23825 }, { "epoch": 0.65, "learning_rate": 5.745824898221644e-06, "loss": 1.4924, "step": 23826 }, { "epoch": 0.65, "learning_rate": 5.7450244383246745e-06, "loss": 1.6802, "step": 23827 }, { "epoch": 0.65, "learning_rate": 5.7442240117166356e-06, "loss": 1.3223, "step": 23828 }, { "epoch": 0.65, "learning_rate": 5.743423618403784e-06, "loss": 1.3013, "step": 23829 }, { "epoch": 0.65, "learning_rate": 5.7426232583923916e-06, "loss": 1.1414, "step": 23830 }, { "epoch": 0.65, "learning_rate": 5.741822931688706e-06, "loss": 1.4346, "step": 23831 }, { "epoch": 0.65, "learning_rate": 5.7410226382989975e-06, "loss": 1.8105, "step": 23832 }, { "epoch": 0.65, "learning_rate": 5.740222378229523e-06, "loss": 1.1445, "step": 23833 }, { "epoch": 0.65, "learning_rate": 5.739422151486552e-06, "loss": 1.7188, "step": 23834 }, { "epoch": 0.65, "learning_rate": 5.738621958076331e-06, "loss": 1.125, "step": 23835 }, { "epoch": 0.65, "learning_rate": 5.737821798005132e-06, "loss": 1.2229, "step": 23836 }, { "epoch": 0.65, "learning_rate": 5.737021671279208e-06, "loss": 1.1047, "step": 23837 }, { "epoch": 0.65, "learning_rate": 5.736221577904826e-06, "loss": 1.2017, "step": 23838 }, { "epoch": 0.65, "learning_rate": 5.73542151788824e-06, "loss": 1.3196, "step": 23839 }, { "epoch": 0.65, "learning_rate": 5.734621491235707e-06, "loss": 1.2388, "step": 23840 }, { "epoch": 0.65, "learning_rate": 5.7338214979534936e-06, "loss": 1.4141, "step": 23841 }, { "epoch": 0.65, "learning_rate": 5.733021538047856e-06, "loss": 1.2129, "step": 23842 }, { "epoch": 0.65, "learning_rate": 5.732221611525051e-06, "loss": 1.3098, "step": 23843 }, { "epoch": 0.65, "learning_rate": 5.731421718391333e-06, "loss": 1.2021, "step": 23844 }, { "epoch": 0.65, "learning_rate": 5.730621858652967e-06, "loss": 1.219, "step": 23845 }, { "epoch": 0.65, "learning_rate": 5.729822032316209e-06, "loss": 1.2295, "step": 23846 }, { "epoch": 0.65, "learning_rate": 5.7290222393873156e-06, "loss": 1.2642, "step": 23847 }, { "epoch": 0.65, "learning_rate": 5.728222479872539e-06, "loss": 1.3503, "step": 23848 }, { "epoch": 0.65, "learning_rate": 5.7274227537781466e-06, "loss": 1.2363, "step": 23849 }, { "epoch": 0.65, "learning_rate": 5.726623061110388e-06, "loss": 1.3582, "step": 23850 }, { "epoch": 0.65, "learning_rate": 5.725823401875521e-06, "loss": 1.1897, "step": 23851 }, { "epoch": 0.65, "learning_rate": 5.725023776079799e-06, "loss": 1.231, "step": 23852 }, { "epoch": 0.65, "learning_rate": 5.724224183729485e-06, "loss": 1.2075, "step": 23853 }, { "epoch": 0.65, "learning_rate": 5.723424624830829e-06, "loss": 1.4177, "step": 23854 }, { "epoch": 0.65, "learning_rate": 5.722625099390085e-06, "loss": 1.311, "step": 23855 }, { "epoch": 0.65, "learning_rate": 5.721825607413513e-06, "loss": 1.2258, "step": 23856 }, { "epoch": 0.65, "learning_rate": 5.7210261489073675e-06, "loss": 1.165, "step": 23857 }, { "epoch": 0.65, "learning_rate": 5.720226723877901e-06, "loss": 1.1704, "step": 23858 }, { "epoch": 0.65, "learning_rate": 5.719427332331365e-06, "loss": 1.3025, "step": 23859 }, { "epoch": 0.65, "learning_rate": 5.718627974274018e-06, "loss": 1.4688, "step": 23860 }, { "epoch": 0.65, "learning_rate": 5.717828649712114e-06, "loss": 1.2554, "step": 23861 }, { "epoch": 0.65, "learning_rate": 5.717029358651906e-06, "loss": 1.175, "step": 23862 }, { "epoch": 0.65, "learning_rate": 5.71623010109964e-06, "loss": 1.313, "step": 23863 }, { "epoch": 0.65, "learning_rate": 5.715430877061581e-06, "loss": 1.2434, "step": 23864 }, { "epoch": 0.65, "learning_rate": 5.714631686543977e-06, "loss": 1.2458, "step": 23865 }, { "epoch": 0.65, "learning_rate": 5.713832529553077e-06, "loss": 1.293, "step": 23866 }, { "epoch": 0.65, "learning_rate": 5.713033406095133e-06, "loss": 1.2175, "step": 23867 }, { "epoch": 0.65, "learning_rate": 5.712234316176399e-06, "loss": 1.2407, "step": 23868 }, { "epoch": 0.65, "learning_rate": 5.711435259803137e-06, "loss": 1.0542, "step": 23869 }, { "epoch": 0.65, "learning_rate": 5.7106362369815805e-06, "loss": 1.3369, "step": 23870 }, { "epoch": 0.65, "learning_rate": 5.7098372477179935e-06, "loss": 1.4165, "step": 23871 }, { "epoch": 0.65, "learning_rate": 5.709038292018617e-06, "loss": 1.2874, "step": 23872 }, { "epoch": 0.65, "learning_rate": 5.7082393698897164e-06, "loss": 1.2576, "step": 23873 }, { "epoch": 0.65, "learning_rate": 5.7074404813375235e-06, "loss": 1.2771, "step": 23874 }, { "epoch": 0.65, "learning_rate": 5.706641626368303e-06, "loss": 1.2922, "step": 23875 }, { "epoch": 0.65, "learning_rate": 5.7058428049882955e-06, "loss": 1.2825, "step": 23876 }, { "epoch": 0.65, "learning_rate": 5.705044017203758e-06, "loss": 1.1914, "step": 23877 }, { "epoch": 0.65, "learning_rate": 5.704245263020938e-06, "loss": 1.4028, "step": 23878 }, { "epoch": 0.65, "learning_rate": 5.7034465424460805e-06, "loss": 1.2732, "step": 23879 }, { "epoch": 0.65, "learning_rate": 5.7026478554854345e-06, "loss": 1.2308, "step": 23880 }, { "epoch": 0.65, "learning_rate": 5.701849202145256e-06, "loss": 1.2864, "step": 23881 }, { "epoch": 0.65, "learning_rate": 5.701050582431786e-06, "loss": 1.2708, "step": 23882 }, { "epoch": 0.65, "learning_rate": 5.700251996351276e-06, "loss": 1.3481, "step": 23883 }, { "epoch": 0.65, "learning_rate": 5.699453443909968e-06, "loss": 1.1079, "step": 23884 }, { "epoch": 0.65, "learning_rate": 5.698654925114117e-06, "loss": 1.3577, "step": 23885 }, { "epoch": 0.65, "learning_rate": 5.697856439969969e-06, "loss": 1.3564, "step": 23886 }, { "epoch": 0.65, "learning_rate": 5.697057988483765e-06, "loss": 1.2695, "step": 23887 }, { "epoch": 0.65, "learning_rate": 5.6962595706617585e-06, "loss": 1.2817, "step": 23888 }, { "epoch": 0.65, "learning_rate": 5.695461186510194e-06, "loss": 1.3193, "step": 23889 }, { "epoch": 0.65, "learning_rate": 5.694662836035318e-06, "loss": 1.2949, "step": 23890 }, { "epoch": 0.65, "learning_rate": 5.693864519243371e-06, "loss": 1.2812, "step": 23891 }, { "epoch": 0.65, "learning_rate": 5.693066236140606e-06, "loss": 1.158, "step": 23892 }, { "epoch": 0.65, "learning_rate": 5.6922679867332665e-06, "loss": 1.2502, "step": 23893 }, { "epoch": 0.65, "learning_rate": 5.6914697710275965e-06, "loss": 1.3406, "step": 23894 }, { "epoch": 0.65, "learning_rate": 5.690671589029837e-06, "loss": 1.7642, "step": 23895 }, { "epoch": 0.65, "learning_rate": 5.689873440746241e-06, "loss": 1.321, "step": 23896 }, { "epoch": 0.65, "learning_rate": 5.689075326183049e-06, "loss": 1.2368, "step": 23897 }, { "epoch": 0.65, "learning_rate": 5.688277245346503e-06, "loss": 1.2844, "step": 23898 }, { "epoch": 0.65, "learning_rate": 5.687479198242845e-06, "loss": 1.2275, "step": 23899 }, { "epoch": 0.65, "learning_rate": 5.686681184878325e-06, "loss": 1.3269, "step": 23900 }, { "epoch": 0.65, "learning_rate": 5.685883205259184e-06, "loss": 1.1406, "step": 23901 }, { "epoch": 0.65, "learning_rate": 5.68508525939166e-06, "loss": 1.322, "step": 23902 }, { "epoch": 0.65, "learning_rate": 5.684287347282005e-06, "loss": 1.2573, "step": 23903 }, { "epoch": 0.65, "learning_rate": 5.683489468936455e-06, "loss": 1.0645, "step": 23904 }, { "epoch": 0.65, "learning_rate": 5.682691624361254e-06, "loss": 1.2251, "step": 23905 }, { "epoch": 0.65, "learning_rate": 5.68189381356264e-06, "loss": 1.2129, "step": 23906 }, { "epoch": 0.65, "learning_rate": 5.6810960365468616e-06, "loss": 1.2715, "step": 23907 }, { "epoch": 0.65, "learning_rate": 5.6802982933201565e-06, "loss": 1.2581, "step": 23908 }, { "epoch": 0.65, "learning_rate": 5.679500583888768e-06, "loss": 1.104, "step": 23909 }, { "epoch": 0.65, "learning_rate": 5.678702908258931e-06, "loss": 1.3655, "step": 23910 }, { "epoch": 0.65, "learning_rate": 5.6779052664368925e-06, "loss": 1.214, "step": 23911 }, { "epoch": 0.65, "learning_rate": 5.677107658428889e-06, "loss": 1.1257, "step": 23912 }, { "epoch": 0.65, "learning_rate": 5.676310084241168e-06, "loss": 1.345, "step": 23913 }, { "epoch": 0.65, "learning_rate": 5.6755125438799575e-06, "loss": 1.4089, "step": 23914 }, { "epoch": 0.65, "learning_rate": 5.674715037351504e-06, "loss": 1.2673, "step": 23915 }, { "epoch": 0.65, "learning_rate": 5.673917564662048e-06, "loss": 1.4087, "step": 23916 }, { "epoch": 0.65, "learning_rate": 5.673120125817828e-06, "loss": 1.1946, "step": 23917 }, { "epoch": 0.65, "learning_rate": 5.672322720825082e-06, "loss": 1.3464, "step": 23918 }, { "epoch": 0.65, "learning_rate": 5.671525349690043e-06, "loss": 1.4197, "step": 23919 }, { "epoch": 0.65, "learning_rate": 5.670728012418959e-06, "loss": 1.3845, "step": 23920 }, { "epoch": 0.65, "learning_rate": 5.669930709018063e-06, "loss": 1.3745, "step": 23921 }, { "epoch": 0.65, "learning_rate": 5.669133439493593e-06, "loss": 1.2556, "step": 23922 }, { "epoch": 0.65, "learning_rate": 5.668336203851782e-06, "loss": 1.6821, "step": 23923 }, { "epoch": 0.65, "learning_rate": 5.667539002098876e-06, "loss": 1.4062, "step": 23924 }, { "epoch": 0.65, "learning_rate": 5.666741834241107e-06, "loss": 1.293, "step": 23925 }, { "epoch": 0.65, "learning_rate": 5.665944700284713e-06, "loss": 1.2629, "step": 23926 }, { "epoch": 0.65, "learning_rate": 5.665147600235926e-06, "loss": 1.2664, "step": 23927 }, { "epoch": 0.65, "learning_rate": 5.66435053410099e-06, "loss": 1.0748, "step": 23928 }, { "epoch": 0.65, "learning_rate": 5.6635535018861354e-06, "loss": 1.29, "step": 23929 }, { "epoch": 0.65, "learning_rate": 5.662756503597595e-06, "loss": 1.1475, "step": 23930 }, { "epoch": 0.65, "learning_rate": 5.661959539241613e-06, "loss": 1.116, "step": 23931 }, { "epoch": 0.65, "learning_rate": 5.66116260882442e-06, "loss": 1.2786, "step": 23932 }, { "epoch": 0.65, "learning_rate": 5.660365712352249e-06, "loss": 1.3442, "step": 23933 }, { "epoch": 0.65, "learning_rate": 5.659568849831334e-06, "loss": 1.3169, "step": 23934 }, { "epoch": 0.65, "learning_rate": 5.658772021267914e-06, "loss": 1.3784, "step": 23935 }, { "epoch": 0.65, "learning_rate": 5.6579752266682205e-06, "loss": 1.325, "step": 23936 }, { "epoch": 0.65, "learning_rate": 5.657178466038488e-06, "loss": 1.1104, "step": 23937 }, { "epoch": 0.65, "learning_rate": 5.656381739384944e-06, "loss": 1.2705, "step": 23938 }, { "epoch": 0.65, "learning_rate": 5.655585046713831e-06, "loss": 1.373, "step": 23939 }, { "epoch": 0.65, "learning_rate": 5.654788388031378e-06, "loss": 1.241, "step": 23940 }, { "epoch": 0.65, "learning_rate": 5.653991763343817e-06, "loss": 1.2944, "step": 23941 }, { "epoch": 0.65, "learning_rate": 5.6531951726573765e-06, "loss": 1.1245, "step": 23942 }, { "epoch": 0.65, "learning_rate": 5.652398615978298e-06, "loss": 1.0758, "step": 23943 }, { "epoch": 0.65, "learning_rate": 5.651602093312807e-06, "loss": 1.1875, "step": 23944 }, { "epoch": 0.65, "learning_rate": 5.650805604667138e-06, "loss": 1.3708, "step": 23945 }, { "epoch": 0.65, "learning_rate": 5.650009150047515e-06, "loss": 1.186, "step": 23946 }, { "epoch": 0.65, "learning_rate": 5.649212729460176e-06, "loss": 1.2439, "step": 23947 }, { "epoch": 0.65, "learning_rate": 5.6484163429113585e-06, "loss": 1.344, "step": 23948 }, { "epoch": 0.65, "learning_rate": 5.647619990407278e-06, "loss": 1.3398, "step": 23949 }, { "epoch": 0.65, "learning_rate": 5.646823671954175e-06, "loss": 1.2358, "step": 23950 }, { "epoch": 0.65, "learning_rate": 5.646027387558273e-06, "loss": 1.1831, "step": 23951 }, { "epoch": 0.65, "learning_rate": 5.6452311372258126e-06, "loss": 1.2393, "step": 23952 }, { "epoch": 0.65, "learning_rate": 5.644434920963009e-06, "loss": 1.2957, "step": 23953 }, { "epoch": 0.65, "learning_rate": 5.643638738776103e-06, "loss": 1.2063, "step": 23954 }, { "epoch": 0.65, "learning_rate": 5.6428425906713135e-06, "loss": 1.3501, "step": 23955 }, { "epoch": 0.65, "learning_rate": 5.6420464766548835e-06, "loss": 1.4131, "step": 23956 }, { "epoch": 0.65, "learning_rate": 5.641250396733025e-06, "loss": 1.0547, "step": 23957 }, { "epoch": 0.65, "learning_rate": 5.640454350911977e-06, "loss": 1.397, "step": 23958 }, { "epoch": 0.65, "learning_rate": 5.639658339197959e-06, "loss": 1.3079, "step": 23959 }, { "epoch": 0.65, "learning_rate": 5.638862361597215e-06, "loss": 1.1598, "step": 23960 }, { "epoch": 0.65, "learning_rate": 5.6380664181159506e-06, "loss": 1.322, "step": 23961 }, { "epoch": 0.65, "learning_rate": 5.637270508760404e-06, "loss": 1.3616, "step": 23962 }, { "epoch": 0.65, "learning_rate": 5.636474633536806e-06, "loss": 1.3005, "step": 23963 }, { "epoch": 0.65, "learning_rate": 5.635678792451378e-06, "loss": 1.2925, "step": 23964 }, { "epoch": 0.65, "learning_rate": 5.634882985510348e-06, "loss": 1.0, "step": 23965 }, { "epoch": 0.65, "learning_rate": 5.634087212719936e-06, "loss": 1.2588, "step": 23966 }, { "epoch": 0.65, "learning_rate": 5.633291474086376e-06, "loss": 1.1697, "step": 23967 }, { "epoch": 0.65, "learning_rate": 5.632495769615891e-06, "loss": 1.293, "step": 23968 }, { "epoch": 0.65, "learning_rate": 5.631700099314705e-06, "loss": 1.2253, "step": 23969 }, { "epoch": 0.65, "learning_rate": 5.6309044631890395e-06, "loss": 1.3181, "step": 23970 }, { "epoch": 0.65, "learning_rate": 5.6301088612451275e-06, "loss": 1.1483, "step": 23971 }, { "epoch": 0.65, "learning_rate": 5.629313293489188e-06, "loss": 1.0419, "step": 23972 }, { "epoch": 0.65, "learning_rate": 5.628517759927446e-06, "loss": 1.4146, "step": 23973 }, { "epoch": 0.65, "learning_rate": 5.627722260566122e-06, "loss": 1.1467, "step": 23974 }, { "epoch": 0.65, "learning_rate": 5.626926795411447e-06, "loss": 1.4041, "step": 23975 }, { "epoch": 0.65, "learning_rate": 5.62613136446964e-06, "loss": 1.4241, "step": 23976 }, { "epoch": 0.65, "learning_rate": 5.625335967746921e-06, "loss": 1.2861, "step": 23977 }, { "epoch": 0.65, "learning_rate": 5.62454060524952e-06, "loss": 1.0273, "step": 23978 }, { "epoch": 0.65, "learning_rate": 5.623745276983656e-06, "loss": 1.3352, "step": 23979 }, { "epoch": 0.65, "learning_rate": 5.62294998295555e-06, "loss": 1.2, "step": 23980 }, { "epoch": 0.65, "learning_rate": 5.622154723171422e-06, "loss": 1.26, "step": 23981 }, { "epoch": 0.65, "learning_rate": 5.6213594976375016e-06, "loss": 1.3359, "step": 23982 }, { "epoch": 0.65, "learning_rate": 5.620564306360005e-06, "loss": 1.2136, "step": 23983 }, { "epoch": 0.65, "learning_rate": 5.619769149345153e-06, "loss": 1.2515, "step": 23984 }, { "epoch": 0.66, "learning_rate": 5.618974026599164e-06, "loss": 1.2402, "step": 23985 }, { "epoch": 0.66, "learning_rate": 5.618178938128267e-06, "loss": 1.3237, "step": 23986 }, { "epoch": 0.66, "learning_rate": 5.617383883938677e-06, "loss": 1.1479, "step": 23987 }, { "epoch": 0.66, "learning_rate": 5.616588864036614e-06, "loss": 1.1729, "step": 23988 }, { "epoch": 0.66, "learning_rate": 5.615793878428295e-06, "loss": 1.2065, "step": 23989 }, { "epoch": 0.66, "learning_rate": 5.614998927119947e-06, "loss": 1.1575, "step": 23990 }, { "epoch": 0.66, "learning_rate": 5.614204010117785e-06, "loss": 1.4482, "step": 23991 }, { "epoch": 0.66, "learning_rate": 5.6134091274280245e-06, "loss": 1.3469, "step": 23992 }, { "epoch": 0.66, "learning_rate": 5.612614279056893e-06, "loss": 1.2222, "step": 23993 }, { "epoch": 0.66, "learning_rate": 5.6118194650106e-06, "loss": 1.2529, "step": 23994 }, { "epoch": 0.66, "learning_rate": 5.611024685295376e-06, "loss": 1.2678, "step": 23995 }, { "epoch": 0.66, "learning_rate": 5.610229939917422e-06, "loss": 1.6636, "step": 23996 }, { "epoch": 0.66, "learning_rate": 5.609435228882971e-06, "loss": 1.2231, "step": 23997 }, { "epoch": 0.66, "learning_rate": 5.608640552198228e-06, "loss": 1.251, "step": 23998 }, { "epoch": 0.66, "learning_rate": 5.607845909869425e-06, "loss": 1.3462, "step": 23999 }, { "epoch": 0.66, "learning_rate": 5.607051301902764e-06, "loss": 1.2655, "step": 24000 }, { "epoch": 0.66, "learning_rate": 5.606256728304469e-06, "loss": 1.1724, "step": 24001 }, { "epoch": 0.66, "learning_rate": 5.605462189080753e-06, "loss": 1.3264, "step": 24002 }, { "epoch": 0.66, "learning_rate": 5.604667684237843e-06, "loss": 1.231, "step": 24003 }, { "epoch": 0.66, "learning_rate": 5.603873213781936e-06, "loss": 1.219, "step": 24004 }, { "epoch": 0.66, "learning_rate": 5.603078777719264e-06, "loss": 1.2356, "step": 24005 }, { "epoch": 0.66, "learning_rate": 5.602284376056031e-06, "loss": 1.1152, "step": 24006 }, { "epoch": 0.66, "learning_rate": 5.601490008798465e-06, "loss": 1.293, "step": 24007 }, { "epoch": 0.66, "learning_rate": 5.600695675952766e-06, "loss": 1.2644, "step": 24008 }, { "epoch": 0.66, "learning_rate": 5.599901377525153e-06, "loss": 1.27, "step": 24009 }, { "epoch": 0.66, "learning_rate": 5.599107113521849e-06, "loss": 1.4011, "step": 24010 }, { "epoch": 0.66, "learning_rate": 5.598312883949059e-06, "loss": 1.1799, "step": 24011 }, { "epoch": 0.66, "learning_rate": 5.597518688813002e-06, "loss": 1.0966, "step": 24012 }, { "epoch": 0.66, "learning_rate": 5.596724528119883e-06, "loss": 1.231, "step": 24013 }, { "epoch": 0.66, "learning_rate": 5.595930401875924e-06, "loss": 1.4082, "step": 24014 }, { "epoch": 0.66, "learning_rate": 5.5951363100873365e-06, "loss": 1.1626, "step": 24015 }, { "epoch": 0.66, "learning_rate": 5.594342252760329e-06, "loss": 1.3052, "step": 24016 }, { "epoch": 0.66, "learning_rate": 5.593548229901114e-06, "loss": 1.1187, "step": 24017 }, { "epoch": 0.66, "learning_rate": 5.592754241515909e-06, "loss": 1.2681, "step": 24018 }, { "epoch": 0.66, "learning_rate": 5.591960287610922e-06, "loss": 1.1033, "step": 24019 }, { "epoch": 0.66, "learning_rate": 5.5911663681923645e-06, "loss": 1.3962, "step": 24020 }, { "epoch": 0.66, "learning_rate": 5.590372483266446e-06, "loss": 1.3586, "step": 24021 }, { "epoch": 0.66, "learning_rate": 5.589578632839382e-06, "loss": 1.2446, "step": 24022 }, { "epoch": 0.66, "learning_rate": 5.5887848169173805e-06, "loss": 1.2554, "step": 24023 }, { "epoch": 0.66, "learning_rate": 5.5879910355066505e-06, "loss": 1.2041, "step": 24024 }, { "epoch": 0.66, "learning_rate": 5.587197288613406e-06, "loss": 1.1836, "step": 24025 }, { "epoch": 0.66, "learning_rate": 5.586403576243855e-06, "loss": 1.2019, "step": 24026 }, { "epoch": 0.66, "learning_rate": 5.585609898404207e-06, "loss": 1.29, "step": 24027 }, { "epoch": 0.66, "learning_rate": 5.584816255100669e-06, "loss": 1.355, "step": 24028 }, { "epoch": 0.66, "learning_rate": 5.584022646339456e-06, "loss": 1.4136, "step": 24029 }, { "epoch": 0.66, "learning_rate": 5.583229072126771e-06, "loss": 1.3228, "step": 24030 }, { "epoch": 0.66, "learning_rate": 5.582435532468826e-06, "loss": 1.3003, "step": 24031 }, { "epoch": 0.66, "learning_rate": 5.581642027371826e-06, "loss": 1.2744, "step": 24032 }, { "epoch": 0.66, "learning_rate": 5.5808485568419825e-06, "loss": 1.3271, "step": 24033 }, { "epoch": 0.66, "learning_rate": 5.580055120885503e-06, "loss": 1.3381, "step": 24034 }, { "epoch": 0.66, "learning_rate": 5.579261719508593e-06, "loss": 1.2346, "step": 24035 }, { "epoch": 0.66, "learning_rate": 5.578468352717458e-06, "loss": 1.3079, "step": 24036 }, { "epoch": 0.66, "learning_rate": 5.577675020518311e-06, "loss": 1.3914, "step": 24037 }, { "epoch": 0.66, "learning_rate": 5.576881722917355e-06, "loss": 1.4033, "step": 24038 }, { "epoch": 0.66, "learning_rate": 5.576088459920792e-06, "loss": 1.2385, "step": 24039 }, { "epoch": 0.66, "learning_rate": 5.575295231534836e-06, "loss": 1.1531, "step": 24040 }, { "epoch": 0.66, "learning_rate": 5.5745020377656875e-06, "loss": 1.2773, "step": 24041 }, { "epoch": 0.66, "learning_rate": 5.5737088786195605e-06, "loss": 1.2393, "step": 24042 }, { "epoch": 0.66, "learning_rate": 5.572915754102646e-06, "loss": 1.1018, "step": 24043 }, { "epoch": 0.66, "learning_rate": 5.5721226642211625e-06, "loss": 1.2581, "step": 24044 }, { "epoch": 0.66, "learning_rate": 5.571329608981303e-06, "loss": 1.3215, "step": 24045 }, { "epoch": 0.66, "learning_rate": 5.570536588389287e-06, "loss": 1.0581, "step": 24046 }, { "epoch": 0.66, "learning_rate": 5.5697436024513015e-06, "loss": 1.2397, "step": 24047 }, { "epoch": 0.66, "learning_rate": 5.568950651173563e-06, "loss": 1.3535, "step": 24048 }, { "epoch": 0.66, "learning_rate": 5.568157734562267e-06, "loss": 1.2922, "step": 24049 }, { "epoch": 0.66, "learning_rate": 5.567364852623629e-06, "loss": 1.2385, "step": 24050 }, { "epoch": 0.66, "learning_rate": 5.566572005363836e-06, "loss": 1.6909, "step": 24051 }, { "epoch": 0.66, "learning_rate": 5.565779192789103e-06, "loss": 1.4028, "step": 24052 }, { "epoch": 0.66, "learning_rate": 5.564986414905624e-06, "loss": 1.2156, "step": 24053 }, { "epoch": 0.66, "learning_rate": 5.564193671719611e-06, "loss": 1.2749, "step": 24054 }, { "epoch": 0.66, "learning_rate": 5.56340096323726e-06, "loss": 1.1814, "step": 24055 }, { "epoch": 0.66, "learning_rate": 5.562608289464769e-06, "loss": 1.3633, "step": 24056 }, { "epoch": 0.66, "learning_rate": 5.561815650408348e-06, "loss": 1.406, "step": 24057 }, { "epoch": 0.66, "learning_rate": 5.5610230460741964e-06, "loss": 1.3699, "step": 24058 }, { "epoch": 0.66, "learning_rate": 5.5602304764685114e-06, "loss": 1.397, "step": 24059 }, { "epoch": 0.66, "learning_rate": 5.559437941597492e-06, "loss": 1.2661, "step": 24060 }, { "epoch": 0.66, "learning_rate": 5.558645441467347e-06, "loss": 1.2612, "step": 24061 }, { "epoch": 0.66, "learning_rate": 5.557852976084271e-06, "loss": 1.2888, "step": 24062 }, { "epoch": 0.66, "learning_rate": 5.557060545454462e-06, "loss": 1.1458, "step": 24063 }, { "epoch": 0.66, "learning_rate": 5.556268149584121e-06, "loss": 1.2053, "step": 24064 }, { "epoch": 0.66, "learning_rate": 5.555475788479452e-06, "loss": 1.2698, "step": 24065 }, { "epoch": 0.66, "learning_rate": 5.554683462146649e-06, "loss": 1.3101, "step": 24066 }, { "epoch": 0.66, "learning_rate": 5.553891170591914e-06, "loss": 1.2502, "step": 24067 }, { "epoch": 0.66, "learning_rate": 5.553098913821439e-06, "loss": 1.1667, "step": 24068 }, { "epoch": 0.66, "learning_rate": 5.5523066918414315e-06, "loss": 1.1851, "step": 24069 }, { "epoch": 0.66, "learning_rate": 5.551514504658085e-06, "loss": 1.2795, "step": 24070 }, { "epoch": 0.66, "learning_rate": 5.550722352277591e-06, "loss": 1.342, "step": 24071 }, { "epoch": 0.66, "learning_rate": 5.54993023470616e-06, "loss": 1.3916, "step": 24072 }, { "epoch": 0.66, "learning_rate": 5.54913815194998e-06, "loss": 1.2671, "step": 24073 }, { "epoch": 0.66, "learning_rate": 5.548346104015252e-06, "loss": 1.3635, "step": 24074 }, { "epoch": 0.66, "learning_rate": 5.547554090908166e-06, "loss": 1.394, "step": 24075 }, { "epoch": 0.66, "learning_rate": 5.546762112634927e-06, "loss": 1.2573, "step": 24076 }, { "epoch": 0.66, "learning_rate": 5.5459701692017264e-06, "loss": 1.2783, "step": 24077 }, { "epoch": 0.66, "learning_rate": 5.545178260614763e-06, "loss": 1.4324, "step": 24078 }, { "epoch": 0.66, "learning_rate": 5.544386386880225e-06, "loss": 1.3794, "step": 24079 }, { "epoch": 0.66, "learning_rate": 5.543594548004316e-06, "loss": 1.4814, "step": 24080 }, { "epoch": 0.66, "learning_rate": 5.5428027439932274e-06, "loss": 1.3206, "step": 24081 }, { "epoch": 0.66, "learning_rate": 5.542010974853156e-06, "loss": 1.4268, "step": 24082 }, { "epoch": 0.66, "learning_rate": 5.541219240590289e-06, "loss": 1.0935, "step": 24083 }, { "epoch": 0.66, "learning_rate": 5.540427541210831e-06, "loss": 1.3318, "step": 24084 }, { "epoch": 0.66, "learning_rate": 5.53963587672097e-06, "loss": 1.2146, "step": 24085 }, { "epoch": 0.66, "learning_rate": 5.538844247126897e-06, "loss": 1.3143, "step": 24086 }, { "epoch": 0.66, "learning_rate": 5.538052652434812e-06, "loss": 1.2922, "step": 24087 }, { "epoch": 0.66, "learning_rate": 5.537261092650902e-06, "loss": 1.2034, "step": 24088 }, { "epoch": 0.66, "learning_rate": 5.53646956778137e-06, "loss": 1.3228, "step": 24089 }, { "epoch": 0.66, "learning_rate": 5.535678077832394e-06, "loss": 1.0642, "step": 24090 }, { "epoch": 0.66, "learning_rate": 5.534886622810176e-06, "loss": 1.1729, "step": 24091 }, { "epoch": 0.66, "learning_rate": 5.5340952027209015e-06, "loss": 1.3606, "step": 24092 }, { "epoch": 0.66, "learning_rate": 5.533303817570776e-06, "loss": 1.3103, "step": 24093 }, { "epoch": 0.66, "learning_rate": 5.532512467365971e-06, "loss": 1.094, "step": 24094 }, { "epoch": 0.66, "learning_rate": 5.531721152112693e-06, "loss": 1.2583, "step": 24095 }, { "epoch": 0.66, "learning_rate": 5.530929871817124e-06, "loss": 1.2546, "step": 24096 }, { "epoch": 0.66, "learning_rate": 5.530138626485465e-06, "loss": 1.2852, "step": 24097 }, { "epoch": 0.66, "learning_rate": 5.529347416123891e-06, "loss": 1.3269, "step": 24098 }, { "epoch": 0.66, "learning_rate": 5.528556240738606e-06, "loss": 1.3462, "step": 24099 }, { "epoch": 0.66, "learning_rate": 5.52776510033579e-06, "loss": 1.1995, "step": 24100 }, { "epoch": 0.66, "learning_rate": 5.5269739949216405e-06, "loss": 1.3364, "step": 24101 }, { "epoch": 0.66, "learning_rate": 5.526182924502344e-06, "loss": 1.1448, "step": 24102 }, { "epoch": 0.66, "learning_rate": 5.525391889084084e-06, "loss": 1.488, "step": 24103 }, { "epoch": 0.66, "learning_rate": 5.524600888673058e-06, "loss": 1.3184, "step": 24104 }, { "epoch": 0.66, "learning_rate": 5.523809923275449e-06, "loss": 1.1587, "step": 24105 }, { "epoch": 0.66, "learning_rate": 5.523018992897446e-06, "loss": 1.2751, "step": 24106 }, { "epoch": 0.66, "learning_rate": 5.522228097545235e-06, "loss": 1.175, "step": 24107 }, { "epoch": 0.66, "learning_rate": 5.521437237225009e-06, "loss": 1.3408, "step": 24108 }, { "epoch": 0.66, "learning_rate": 5.520646411942952e-06, "loss": 1.2031, "step": 24109 }, { "epoch": 0.66, "learning_rate": 5.519855621705252e-06, "loss": 1.4062, "step": 24110 }, { "epoch": 0.66, "learning_rate": 5.519064866518089e-06, "loss": 1.2588, "step": 24111 }, { "epoch": 0.66, "learning_rate": 5.518274146387661e-06, "loss": 1.4412, "step": 24112 }, { "epoch": 0.66, "learning_rate": 5.517483461320148e-06, "loss": 1.2388, "step": 24113 }, { "epoch": 0.66, "learning_rate": 5.5166928113217365e-06, "loss": 1.365, "step": 24114 }, { "epoch": 0.66, "learning_rate": 5.5159021963986085e-06, "loss": 1.3684, "step": 24115 }, { "epoch": 0.66, "learning_rate": 5.515111616556958e-06, "loss": 1.2312, "step": 24116 }, { "epoch": 0.66, "learning_rate": 5.514321071802964e-06, "loss": 1.2876, "step": 24117 }, { "epoch": 0.66, "learning_rate": 5.513530562142808e-06, "loss": 1.3359, "step": 24118 }, { "epoch": 0.66, "learning_rate": 5.512740087582685e-06, "loss": 1.3828, "step": 24119 }, { "epoch": 0.66, "learning_rate": 5.511949648128773e-06, "loss": 1.197, "step": 24120 }, { "epoch": 0.66, "learning_rate": 5.5111592437872565e-06, "loss": 1.3074, "step": 24121 }, { "epoch": 0.66, "learning_rate": 5.510368874564315e-06, "loss": 1.3569, "step": 24122 }, { "epoch": 0.66, "learning_rate": 5.509578540466139e-06, "loss": 1.1455, "step": 24123 }, { "epoch": 0.66, "learning_rate": 5.5087882414989106e-06, "loss": 1.0925, "step": 24124 }, { "epoch": 0.66, "learning_rate": 5.507997977668811e-06, "loss": 1.1487, "step": 24125 }, { "epoch": 0.66, "learning_rate": 5.507207748982019e-06, "loss": 1.3533, "step": 24126 }, { "epoch": 0.66, "learning_rate": 5.506417555444724e-06, "loss": 1.2747, "step": 24127 }, { "epoch": 0.66, "learning_rate": 5.505627397063106e-06, "loss": 1.4421, "step": 24128 }, { "epoch": 0.66, "learning_rate": 5.504837273843344e-06, "loss": 1.2859, "step": 24129 }, { "epoch": 0.66, "learning_rate": 5.50404718579162e-06, "loss": 1.3389, "step": 24130 }, { "epoch": 0.66, "learning_rate": 5.503257132914119e-06, "loss": 1.3008, "step": 24131 }, { "epoch": 0.66, "learning_rate": 5.5024671152170205e-06, "loss": 1.0273, "step": 24132 }, { "epoch": 0.66, "learning_rate": 5.5016771327065e-06, "loss": 1.2944, "step": 24133 }, { "epoch": 0.66, "learning_rate": 5.5008871853887455e-06, "loss": 1.3508, "step": 24134 }, { "epoch": 0.66, "learning_rate": 5.500097273269932e-06, "loss": 1.2761, "step": 24135 }, { "epoch": 0.66, "learning_rate": 5.499307396356248e-06, "loss": 1.3823, "step": 24136 }, { "epoch": 0.66, "learning_rate": 5.498517554653859e-06, "loss": 1.3533, "step": 24137 }, { "epoch": 0.66, "learning_rate": 5.497727748168955e-06, "loss": 1.198, "step": 24138 }, { "epoch": 0.66, "learning_rate": 5.4969379769077105e-06, "loss": 1.2395, "step": 24139 }, { "epoch": 0.66, "learning_rate": 5.496148240876307e-06, "loss": 1.3794, "step": 24140 }, { "epoch": 0.66, "learning_rate": 5.495358540080923e-06, "loss": 1.0933, "step": 24141 }, { "epoch": 0.66, "learning_rate": 5.494568874527735e-06, "loss": 1.3818, "step": 24142 }, { "epoch": 0.66, "learning_rate": 5.493779244222919e-06, "loss": 1.2131, "step": 24143 }, { "epoch": 0.66, "learning_rate": 5.492989649172657e-06, "loss": 1.189, "step": 24144 }, { "epoch": 0.66, "learning_rate": 5.492200089383126e-06, "loss": 1.0139, "step": 24145 }, { "epoch": 0.66, "learning_rate": 5.491410564860502e-06, "loss": 1.2622, "step": 24146 }, { "epoch": 0.66, "learning_rate": 5.490621075610958e-06, "loss": 1.3201, "step": 24147 }, { "epoch": 0.66, "learning_rate": 5.489831621640677e-06, "loss": 1.2581, "step": 24148 }, { "epoch": 0.66, "learning_rate": 5.4890422029558325e-06, "loss": 1.1748, "step": 24149 }, { "epoch": 0.66, "learning_rate": 5.488252819562597e-06, "loss": 1.1899, "step": 24150 }, { "epoch": 0.66, "learning_rate": 5.487463471467154e-06, "loss": 1.1157, "step": 24151 }, { "epoch": 0.66, "learning_rate": 5.486674158675676e-06, "loss": 1.314, "step": 24152 }, { "epoch": 0.66, "learning_rate": 5.485884881194336e-06, "loss": 1.314, "step": 24153 }, { "epoch": 0.66, "learning_rate": 5.485095639029305e-06, "loss": 1.3843, "step": 24154 }, { "epoch": 0.66, "learning_rate": 5.484306432186768e-06, "loss": 1.2239, "step": 24155 }, { "epoch": 0.66, "learning_rate": 5.483517260672894e-06, "loss": 1.1125, "step": 24156 }, { "epoch": 0.66, "learning_rate": 5.482728124493857e-06, "loss": 1.345, "step": 24157 }, { "epoch": 0.66, "learning_rate": 5.481939023655827e-06, "loss": 1.7168, "step": 24158 }, { "epoch": 0.66, "learning_rate": 5.481149958164984e-06, "loss": 1.3057, "step": 24159 }, { "epoch": 0.66, "learning_rate": 5.4803609280275e-06, "loss": 1.2532, "step": 24160 }, { "epoch": 0.66, "learning_rate": 5.4795719332495475e-06, "loss": 1.2539, "step": 24161 }, { "epoch": 0.66, "learning_rate": 5.478782973837294e-06, "loss": 1.2737, "step": 24162 }, { "epoch": 0.66, "learning_rate": 5.47799404979692e-06, "loss": 1.1217, "step": 24163 }, { "epoch": 0.66, "learning_rate": 5.4772051611345955e-06, "loss": 1.1621, "step": 24164 }, { "epoch": 0.66, "learning_rate": 5.476416307856486e-06, "loss": 1.4219, "step": 24165 }, { "epoch": 0.66, "learning_rate": 5.4756274899687726e-06, "loss": 1.3345, "step": 24166 }, { "epoch": 0.66, "learning_rate": 5.474838707477621e-06, "loss": 1.283, "step": 24167 }, { "epoch": 0.66, "learning_rate": 5.474049960389205e-06, "loss": 1.3911, "step": 24168 }, { "epoch": 0.66, "learning_rate": 5.473261248709689e-06, "loss": 1.3191, "step": 24169 }, { "epoch": 0.66, "learning_rate": 5.472472572445254e-06, "loss": 1.2012, "step": 24170 }, { "epoch": 0.66, "learning_rate": 5.471683931602062e-06, "loss": 1.1938, "step": 24171 }, { "epoch": 0.66, "learning_rate": 5.470895326186288e-06, "loss": 1.2712, "step": 24172 }, { "epoch": 0.66, "learning_rate": 5.470106756204093e-06, "loss": 1.3923, "step": 24173 }, { "epoch": 0.66, "learning_rate": 5.469318221661658e-06, "loss": 1.3914, "step": 24174 }, { "epoch": 0.66, "learning_rate": 5.468529722565142e-06, "loss": 1.1704, "step": 24175 }, { "epoch": 0.66, "learning_rate": 5.467741258920727e-06, "loss": 1.157, "step": 24176 }, { "epoch": 0.66, "learning_rate": 5.466952830734565e-06, "loss": 1.2322, "step": 24177 }, { "epoch": 0.66, "learning_rate": 5.466164438012833e-06, "loss": 1.0394, "step": 24178 }, { "epoch": 0.66, "learning_rate": 5.465376080761702e-06, "loss": 1.3477, "step": 24179 }, { "epoch": 0.66, "learning_rate": 5.464587758987336e-06, "loss": 1.3105, "step": 24180 }, { "epoch": 0.66, "learning_rate": 5.4637994726959035e-06, "loss": 1.1077, "step": 24181 }, { "epoch": 0.66, "learning_rate": 5.463011221893566e-06, "loss": 1.3455, "step": 24182 }, { "epoch": 0.66, "learning_rate": 5.4622230065865e-06, "loss": 1.3003, "step": 24183 }, { "epoch": 0.66, "learning_rate": 5.461434826780867e-06, "loss": 1.3408, "step": 24184 }, { "epoch": 0.66, "learning_rate": 5.460646682482834e-06, "loss": 1.2229, "step": 24185 }, { "epoch": 0.66, "learning_rate": 5.459858573698562e-06, "loss": 1.2239, "step": 24186 }, { "epoch": 0.66, "learning_rate": 5.459070500434227e-06, "loss": 1.1975, "step": 24187 }, { "epoch": 0.66, "learning_rate": 5.458282462695988e-06, "loss": 1.1873, "step": 24188 }, { "epoch": 0.66, "learning_rate": 5.457494460490012e-06, "loss": 1.2471, "step": 24189 }, { "epoch": 0.66, "learning_rate": 5.456706493822459e-06, "loss": 1.2664, "step": 24190 }, { "epoch": 0.66, "learning_rate": 5.455918562699503e-06, "loss": 1.3054, "step": 24191 }, { "epoch": 0.66, "learning_rate": 5.4551306671273015e-06, "loss": 1.3254, "step": 24192 }, { "epoch": 0.66, "learning_rate": 5.4543428071120205e-06, "loss": 1.1992, "step": 24193 }, { "epoch": 0.66, "learning_rate": 5.453554982659821e-06, "loss": 1.1033, "step": 24194 }, { "epoch": 0.66, "learning_rate": 5.452767193776874e-06, "loss": 1.4233, "step": 24195 }, { "epoch": 0.66, "learning_rate": 5.451979440469337e-06, "loss": 1.365, "step": 24196 }, { "epoch": 0.66, "learning_rate": 5.4511917227433695e-06, "loss": 1.218, "step": 24197 }, { "epoch": 0.66, "learning_rate": 5.450404040605144e-06, "loss": 1.2053, "step": 24198 }, { "epoch": 0.66, "learning_rate": 5.449616394060819e-06, "loss": 1.2136, "step": 24199 }, { "epoch": 0.66, "learning_rate": 5.4488287831165544e-06, "loss": 1.0475, "step": 24200 }, { "epoch": 0.66, "learning_rate": 5.448041207778509e-06, "loss": 1.3101, "step": 24201 }, { "epoch": 0.66, "learning_rate": 5.4472536680528536e-06, "loss": 1.729, "step": 24202 }, { "epoch": 0.66, "learning_rate": 5.446466163945744e-06, "loss": 1.2778, "step": 24203 }, { "epoch": 0.66, "learning_rate": 5.445678695463341e-06, "loss": 1.2766, "step": 24204 }, { "epoch": 0.66, "learning_rate": 5.444891262611804e-06, "loss": 1.2747, "step": 24205 }, { "epoch": 0.66, "learning_rate": 5.444103865397299e-06, "loss": 1.3179, "step": 24206 }, { "epoch": 0.66, "learning_rate": 5.443316503825984e-06, "loss": 1.2356, "step": 24207 }, { "epoch": 0.66, "learning_rate": 5.4425291779040165e-06, "loss": 1.3284, "step": 24208 }, { "epoch": 0.66, "learning_rate": 5.441741887637555e-06, "loss": 1.2939, "step": 24209 }, { "epoch": 0.66, "learning_rate": 5.44095463303276e-06, "loss": 1.166, "step": 24210 }, { "epoch": 0.66, "learning_rate": 5.440167414095802e-06, "loss": 1.1472, "step": 24211 }, { "epoch": 0.66, "learning_rate": 5.43938023083282e-06, "loss": 1.3035, "step": 24212 }, { "epoch": 0.66, "learning_rate": 5.438593083249988e-06, "loss": 1.2742, "step": 24213 }, { "epoch": 0.66, "learning_rate": 5.437805971353454e-06, "loss": 1.1624, "step": 24214 }, { "epoch": 0.66, "learning_rate": 5.437018895149389e-06, "loss": 1.3372, "step": 24215 }, { "epoch": 0.66, "learning_rate": 5.436231854643934e-06, "loss": 1.2356, "step": 24216 }, { "epoch": 0.66, "learning_rate": 5.435444849843261e-06, "loss": 1.4285, "step": 24217 }, { "epoch": 0.66, "learning_rate": 5.434657880753516e-06, "loss": 1.374, "step": 24218 }, { "epoch": 0.66, "learning_rate": 5.433870947380868e-06, "loss": 1.2427, "step": 24219 }, { "epoch": 0.66, "learning_rate": 5.4330840497314584e-06, "loss": 1.3057, "step": 24220 }, { "epoch": 0.66, "learning_rate": 5.432297187811457e-06, "loss": 1.26, "step": 24221 }, { "epoch": 0.66, "learning_rate": 5.43151036162701e-06, "loss": 1.2014, "step": 24222 }, { "epoch": 0.66, "learning_rate": 5.430723571184284e-06, "loss": 1.0911, "step": 24223 }, { "epoch": 0.66, "learning_rate": 5.4299368164894224e-06, "loss": 1.2361, "step": 24224 }, { "epoch": 0.66, "learning_rate": 5.429150097548585e-06, "loss": 1.2781, "step": 24225 }, { "epoch": 0.66, "learning_rate": 5.428363414367933e-06, "loss": 1.3723, "step": 24226 }, { "epoch": 0.66, "learning_rate": 5.427576766953615e-06, "loss": 1.4194, "step": 24227 }, { "epoch": 0.66, "learning_rate": 5.426790155311787e-06, "loss": 1.0903, "step": 24228 }, { "epoch": 0.66, "learning_rate": 5.426003579448598e-06, "loss": 1.1299, "step": 24229 }, { "epoch": 0.66, "learning_rate": 5.42521703937021e-06, "loss": 1.2739, "step": 24230 }, { "epoch": 0.66, "learning_rate": 5.424430535082772e-06, "loss": 1.3228, "step": 24231 }, { "epoch": 0.66, "learning_rate": 5.42364406659244e-06, "loss": 1.2107, "step": 24232 }, { "epoch": 0.66, "learning_rate": 5.422857633905358e-06, "loss": 1.3972, "step": 24233 }, { "epoch": 0.66, "learning_rate": 5.422071237027692e-06, "loss": 1.3967, "step": 24234 }, { "epoch": 0.66, "learning_rate": 5.421284875965587e-06, "loss": 1.3293, "step": 24235 }, { "epoch": 0.66, "learning_rate": 5.420498550725195e-06, "loss": 1.3367, "step": 24236 }, { "epoch": 0.66, "learning_rate": 5.419712261312666e-06, "loss": 1.282, "step": 24237 }, { "epoch": 0.66, "learning_rate": 5.418926007734159e-06, "loss": 1.2295, "step": 24238 }, { "epoch": 0.66, "learning_rate": 5.41813978999582e-06, "loss": 1.3789, "step": 24239 }, { "epoch": 0.66, "learning_rate": 5.4173536081037965e-06, "loss": 1.3125, "step": 24240 }, { "epoch": 0.66, "learning_rate": 5.416567462064248e-06, "loss": 1.0242, "step": 24241 }, { "epoch": 0.66, "learning_rate": 5.41578135188332e-06, "loss": 1.4556, "step": 24242 }, { "epoch": 0.66, "learning_rate": 5.4149952775671635e-06, "loss": 1.4219, "step": 24243 }, { "epoch": 0.66, "learning_rate": 5.4142092391219235e-06, "loss": 1.2427, "step": 24244 }, { "epoch": 0.66, "learning_rate": 5.4134232365537585e-06, "loss": 1.3423, "step": 24245 }, { "epoch": 0.66, "learning_rate": 5.412637269868814e-06, "loss": 1.3601, "step": 24246 }, { "epoch": 0.66, "learning_rate": 5.4118513390732374e-06, "loss": 1.2432, "step": 24247 }, { "epoch": 0.66, "learning_rate": 5.4110654441731735e-06, "loss": 1.2976, "step": 24248 }, { "epoch": 0.66, "learning_rate": 5.4102795851747815e-06, "loss": 1.1545, "step": 24249 }, { "epoch": 0.66, "learning_rate": 5.409493762084202e-06, "loss": 1.3525, "step": 24250 }, { "epoch": 0.66, "learning_rate": 5.408707974907586e-06, "loss": 1.1807, "step": 24251 }, { "epoch": 0.66, "learning_rate": 5.407922223651076e-06, "loss": 1.7393, "step": 24252 }, { "epoch": 0.66, "learning_rate": 5.4071365083208274e-06, "loss": 1.3984, "step": 24253 }, { "epoch": 0.66, "learning_rate": 5.406350828922982e-06, "loss": 1.0889, "step": 24254 }, { "epoch": 0.66, "learning_rate": 5.4055651854636885e-06, "loss": 1.387, "step": 24255 }, { "epoch": 0.66, "learning_rate": 5.404779577949086e-06, "loss": 1.2561, "step": 24256 }, { "epoch": 0.66, "learning_rate": 5.4039940063853304e-06, "loss": 1.187, "step": 24257 }, { "epoch": 0.66, "learning_rate": 5.403208470778571e-06, "loss": 1.3467, "step": 24258 }, { "epoch": 0.66, "learning_rate": 5.40242297113494e-06, "loss": 1.3542, "step": 24259 }, { "epoch": 0.66, "learning_rate": 5.4016375074605935e-06, "loss": 1.2468, "step": 24260 }, { "epoch": 0.66, "learning_rate": 5.400852079761667e-06, "loss": 1.28, "step": 24261 }, { "epoch": 0.66, "learning_rate": 5.400066688044321e-06, "loss": 1.2888, "step": 24262 }, { "epoch": 0.66, "learning_rate": 5.399281332314681e-06, "loss": 1.271, "step": 24263 }, { "epoch": 0.66, "learning_rate": 5.398496012578907e-06, "loss": 1.2969, "step": 24264 }, { "epoch": 0.66, "learning_rate": 5.39771072884313e-06, "loss": 1.3696, "step": 24265 }, { "epoch": 0.66, "learning_rate": 5.396925481113509e-06, "loss": 1.3179, "step": 24266 }, { "epoch": 0.66, "learning_rate": 5.396140269396169e-06, "loss": 1.2524, "step": 24267 }, { "epoch": 0.66, "learning_rate": 5.395355093697268e-06, "loss": 1.3486, "step": 24268 }, { "epoch": 0.66, "learning_rate": 5.394569954022939e-06, "loss": 1.3591, "step": 24269 }, { "epoch": 0.66, "learning_rate": 5.393784850379338e-06, "loss": 1.2216, "step": 24270 }, { "epoch": 0.66, "learning_rate": 5.39299978277259e-06, "loss": 1.2717, "step": 24271 }, { "epoch": 0.66, "learning_rate": 5.392214751208844e-06, "loss": 1.3408, "step": 24272 }, { "epoch": 0.66, "learning_rate": 5.391429755694249e-06, "loss": 1.2256, "step": 24273 }, { "epoch": 0.66, "learning_rate": 5.39064479623494e-06, "loss": 1.4153, "step": 24274 }, { "epoch": 0.66, "learning_rate": 5.389859872837057e-06, "loss": 1.1921, "step": 24275 }, { "epoch": 0.66, "learning_rate": 5.38907498550674e-06, "loss": 1.2202, "step": 24276 }, { "epoch": 0.66, "learning_rate": 5.388290134250136e-06, "loss": 1.2146, "step": 24277 }, { "epoch": 0.66, "learning_rate": 5.387505319073382e-06, "loss": 1.2368, "step": 24278 }, { "epoch": 0.66, "learning_rate": 5.386720539982617e-06, "loss": 1.1523, "step": 24279 }, { "epoch": 0.66, "learning_rate": 5.385935796983976e-06, "loss": 1.3442, "step": 24280 }, { "epoch": 0.66, "learning_rate": 5.385151090083609e-06, "loss": 1.2051, "step": 24281 }, { "epoch": 0.66, "learning_rate": 5.38436641928765e-06, "loss": 1.1841, "step": 24282 }, { "epoch": 0.66, "learning_rate": 5.383581784602237e-06, "loss": 1.2654, "step": 24283 }, { "epoch": 0.66, "learning_rate": 5.3827971860335045e-06, "loss": 1.2463, "step": 24284 }, { "epoch": 0.66, "learning_rate": 5.3820126235876e-06, "loss": 1.176, "step": 24285 }, { "epoch": 0.66, "learning_rate": 5.381228097270658e-06, "loss": 1.4075, "step": 24286 }, { "epoch": 0.66, "learning_rate": 5.380443607088812e-06, "loss": 1.4458, "step": 24287 }, { "epoch": 0.66, "learning_rate": 5.379659153048207e-06, "loss": 1.2278, "step": 24288 }, { "epoch": 0.66, "learning_rate": 5.378874735154974e-06, "loss": 1.2332, "step": 24289 }, { "epoch": 0.66, "learning_rate": 5.378090353415253e-06, "loss": 1.228, "step": 24290 }, { "epoch": 0.66, "learning_rate": 5.377306007835177e-06, "loss": 1.2791, "step": 24291 }, { "epoch": 0.66, "learning_rate": 5.376521698420888e-06, "loss": 1.2947, "step": 24292 }, { "epoch": 0.66, "learning_rate": 5.3757374251785196e-06, "loss": 1.2471, "step": 24293 }, { "epoch": 0.66, "learning_rate": 5.374953188114207e-06, "loss": 1.1604, "step": 24294 }, { "epoch": 0.66, "learning_rate": 5.3741689872340805e-06, "loss": 1.2689, "step": 24295 }, { "epoch": 0.66, "learning_rate": 5.373384822544285e-06, "loss": 1.231, "step": 24296 }, { "epoch": 0.66, "learning_rate": 5.3726006940509535e-06, "loss": 1.3, "step": 24297 }, { "epoch": 0.66, "learning_rate": 5.371816601760216e-06, "loss": 1.2363, "step": 24298 }, { "epoch": 0.66, "learning_rate": 5.3710325456782054e-06, "loss": 1.4136, "step": 24299 }, { "epoch": 0.66, "learning_rate": 5.370248525811064e-06, "loss": 1.2471, "step": 24300 }, { "epoch": 0.66, "learning_rate": 5.36946454216492e-06, "loss": 1.1582, "step": 24301 }, { "epoch": 0.66, "learning_rate": 5.3686805947459096e-06, "loss": 1.1458, "step": 24302 }, { "epoch": 0.66, "learning_rate": 5.367896683560159e-06, "loss": 1.2866, "step": 24303 }, { "epoch": 0.66, "learning_rate": 5.367112808613807e-06, "loss": 1.3569, "step": 24304 }, { "epoch": 0.66, "learning_rate": 5.366328969912994e-06, "loss": 1.2445, "step": 24305 }, { "epoch": 0.66, "learning_rate": 5.365545167463836e-06, "loss": 1.0781, "step": 24306 }, { "epoch": 0.66, "learning_rate": 5.364761401272478e-06, "loss": 1.2732, "step": 24307 }, { "epoch": 0.66, "learning_rate": 5.363977671345042e-06, "loss": 1.4478, "step": 24308 }, { "epoch": 0.66, "learning_rate": 5.363193977687673e-06, "loss": 1.1157, "step": 24309 }, { "epoch": 0.66, "learning_rate": 5.362410320306487e-06, "loss": 1.375, "step": 24310 }, { "epoch": 0.66, "learning_rate": 5.361626699207625e-06, "loss": 1.2646, "step": 24311 }, { "epoch": 0.66, "learning_rate": 5.360843114397212e-06, "loss": 1.2358, "step": 24312 }, { "epoch": 0.66, "learning_rate": 5.3600595658813855e-06, "loss": 1.3027, "step": 24313 }, { "epoch": 0.66, "learning_rate": 5.359276053666267e-06, "loss": 1.4292, "step": 24314 }, { "epoch": 0.66, "learning_rate": 5.358492577757992e-06, "loss": 1.2224, "step": 24315 }, { "epoch": 0.66, "learning_rate": 5.357709138162686e-06, "loss": 1.3647, "step": 24316 }, { "epoch": 0.66, "learning_rate": 5.356925734886488e-06, "loss": 1.2437, "step": 24317 }, { "epoch": 0.66, "learning_rate": 5.356142367935512e-06, "loss": 1.2173, "step": 24318 }, { "epoch": 0.66, "learning_rate": 5.355359037315893e-06, "loss": 1.4521, "step": 24319 }, { "epoch": 0.66, "learning_rate": 5.354575743033767e-06, "loss": 1.22, "step": 24320 }, { "epoch": 0.66, "learning_rate": 5.353792485095255e-06, "loss": 1.2356, "step": 24321 }, { "epoch": 0.66, "learning_rate": 5.3530092635064855e-06, "loss": 1.365, "step": 24322 }, { "epoch": 0.66, "learning_rate": 5.3522260782735825e-06, "loss": 1.2017, "step": 24323 }, { "epoch": 0.66, "learning_rate": 5.3514429294026815e-06, "loss": 1.1797, "step": 24324 }, { "epoch": 0.66, "learning_rate": 5.350659816899905e-06, "loss": 1.3113, "step": 24325 }, { "epoch": 0.66, "learning_rate": 5.3498767407713795e-06, "loss": 1.3037, "step": 24326 }, { "epoch": 0.66, "learning_rate": 5.349093701023228e-06, "loss": 1.2556, "step": 24327 }, { "epoch": 0.66, "learning_rate": 5.348310697661584e-06, "loss": 1.2329, "step": 24328 }, { "epoch": 0.66, "learning_rate": 5.34752773069257e-06, "loss": 1.3245, "step": 24329 }, { "epoch": 0.66, "learning_rate": 5.346744800122312e-06, "loss": 1.3652, "step": 24330 }, { "epoch": 0.66, "learning_rate": 5.345961905956929e-06, "loss": 1.1682, "step": 24331 }, { "epoch": 0.66, "learning_rate": 5.345179048202556e-06, "loss": 1.1008, "step": 24332 }, { "epoch": 0.66, "learning_rate": 5.344396226865314e-06, "loss": 1.2117, "step": 24333 }, { "epoch": 0.66, "learning_rate": 5.343613441951323e-06, "loss": 1.1377, "step": 24334 }, { "epoch": 0.66, "learning_rate": 5.342830693466714e-06, "loss": 1.3096, "step": 24335 }, { "epoch": 0.66, "learning_rate": 5.3420479814176086e-06, "loss": 1.1467, "step": 24336 }, { "epoch": 0.66, "learning_rate": 5.341265305810128e-06, "loss": 1.2078, "step": 24337 }, { "epoch": 0.66, "learning_rate": 5.340482666650394e-06, "loss": 1.2949, "step": 24338 }, { "epoch": 0.66, "learning_rate": 5.339700063944536e-06, "loss": 1.3167, "step": 24339 }, { "epoch": 0.66, "learning_rate": 5.338917497698674e-06, "loss": 1.2288, "step": 24340 }, { "epoch": 0.66, "learning_rate": 5.338134967918928e-06, "loss": 1.1437, "step": 24341 }, { "epoch": 0.66, "learning_rate": 5.337352474611421e-06, "loss": 1.2637, "step": 24342 }, { "epoch": 0.66, "learning_rate": 5.336570017782276e-06, "loss": 1.1628, "step": 24343 }, { "epoch": 0.66, "learning_rate": 5.3357875974376175e-06, "loss": 1.2087, "step": 24344 }, { "epoch": 0.66, "learning_rate": 5.3350052135835616e-06, "loss": 1.1003, "step": 24345 }, { "epoch": 0.66, "learning_rate": 5.334222866226228e-06, "loss": 1.7222, "step": 24346 }, { "epoch": 0.66, "learning_rate": 5.333440555371745e-06, "loss": 1.3965, "step": 24347 }, { "epoch": 0.66, "learning_rate": 5.332658281026229e-06, "loss": 1.2534, "step": 24348 }, { "epoch": 0.66, "learning_rate": 5.3318760431957935e-06, "loss": 1.2332, "step": 24349 }, { "epoch": 0.66, "learning_rate": 5.331093841886572e-06, "loss": 1.189, "step": 24350 }, { "epoch": 0.67, "learning_rate": 5.330311677104672e-06, "loss": 1.2219, "step": 24351 }, { "epoch": 0.67, "learning_rate": 5.329529548856224e-06, "loss": 1.158, "step": 24352 }, { "epoch": 0.67, "learning_rate": 5.328747457147333e-06, "loss": 1.2476, "step": 24353 }, { "epoch": 0.67, "learning_rate": 5.32796540198413e-06, "loss": 1.4246, "step": 24354 }, { "epoch": 0.67, "learning_rate": 5.327183383372725e-06, "loss": 1.332, "step": 24355 }, { "epoch": 0.67, "learning_rate": 5.3264014013192466e-06, "loss": 1.1033, "step": 24356 }, { "epoch": 0.67, "learning_rate": 5.325619455829798e-06, "loss": 1.375, "step": 24357 }, { "epoch": 0.67, "learning_rate": 5.32483754691051e-06, "loss": 1.2803, "step": 24358 }, { "epoch": 0.67, "learning_rate": 5.3240556745674895e-06, "loss": 1.269, "step": 24359 }, { "epoch": 0.67, "learning_rate": 5.323273838806868e-06, "loss": 1.1073, "step": 24360 }, { "epoch": 0.67, "learning_rate": 5.3224920396347435e-06, "loss": 1.4131, "step": 24361 }, { "epoch": 0.67, "learning_rate": 5.321710277057247e-06, "loss": 1.3542, "step": 24362 }, { "epoch": 0.67, "learning_rate": 5.320928551080484e-06, "loss": 1.2993, "step": 24363 }, { "epoch": 0.67, "learning_rate": 5.320146861710584e-06, "loss": 1.7202, "step": 24364 }, { "epoch": 0.67, "learning_rate": 5.319365208953648e-06, "loss": 1.2654, "step": 24365 }, { "epoch": 0.67, "learning_rate": 5.318583592815796e-06, "loss": 1.1765, "step": 24366 }, { "epoch": 0.67, "learning_rate": 5.317802013303149e-06, "loss": 1.2476, "step": 24367 }, { "epoch": 0.67, "learning_rate": 5.317020470421817e-06, "loss": 1.3328, "step": 24368 }, { "epoch": 0.67, "learning_rate": 5.316238964177915e-06, "loss": 1.3879, "step": 24369 }, { "epoch": 0.67, "learning_rate": 5.315457494577554e-06, "loss": 1.3762, "step": 24370 }, { "epoch": 0.67, "learning_rate": 5.314676061626853e-06, "loss": 1.2652, "step": 24371 }, { "epoch": 0.67, "learning_rate": 5.313894665331925e-06, "loss": 1.2239, "step": 24372 }, { "epoch": 0.67, "learning_rate": 5.31311330569888e-06, "loss": 1.2666, "step": 24373 }, { "epoch": 0.67, "learning_rate": 5.31233198273383e-06, "loss": 1.249, "step": 24374 }, { "epoch": 0.67, "learning_rate": 5.311550696442893e-06, "loss": 1.3896, "step": 24375 }, { "epoch": 0.67, "learning_rate": 5.310769446832178e-06, "loss": 1.2251, "step": 24376 }, { "epoch": 0.67, "learning_rate": 5.309988233907799e-06, "loss": 1.2434, "step": 24377 }, { "epoch": 0.67, "learning_rate": 5.309207057675862e-06, "loss": 1.1687, "step": 24378 }, { "epoch": 0.67, "learning_rate": 5.308425918142489e-06, "loss": 1.3936, "step": 24379 }, { "epoch": 0.67, "learning_rate": 5.307644815313784e-06, "loss": 1.2544, "step": 24380 }, { "epoch": 0.67, "learning_rate": 5.3068637491958565e-06, "loss": 1.2439, "step": 24381 }, { "epoch": 0.67, "learning_rate": 5.306082719794823e-06, "loss": 1.3164, "step": 24382 }, { "epoch": 0.67, "learning_rate": 5.305301727116791e-06, "loss": 1.4424, "step": 24383 }, { "epoch": 0.67, "learning_rate": 5.304520771167872e-06, "loss": 1.05, "step": 24384 }, { "epoch": 0.67, "learning_rate": 5.3037398519541695e-06, "loss": 1.1391, "step": 24385 }, { "epoch": 0.67, "learning_rate": 5.302958969481802e-06, "loss": 1.1589, "step": 24386 }, { "epoch": 0.67, "learning_rate": 5.302178123756876e-06, "loss": 1.3279, "step": 24387 }, { "epoch": 0.67, "learning_rate": 5.301397314785497e-06, "loss": 1.3132, "step": 24388 }, { "epoch": 0.67, "learning_rate": 5.300616542573773e-06, "loss": 1.3494, "step": 24389 }, { "epoch": 0.67, "learning_rate": 5.29983580712782e-06, "loss": 1.151, "step": 24390 }, { "epoch": 0.67, "learning_rate": 5.299055108453741e-06, "loss": 1.2371, "step": 24391 }, { "epoch": 0.67, "learning_rate": 5.298274446557645e-06, "loss": 1.2678, "step": 24392 }, { "epoch": 0.67, "learning_rate": 5.297493821445634e-06, "loss": 1.1245, "step": 24393 }, { "epoch": 0.67, "learning_rate": 5.296713233123825e-06, "loss": 1.321, "step": 24394 }, { "epoch": 0.67, "learning_rate": 5.295932681598319e-06, "loss": 1.2097, "step": 24395 }, { "epoch": 0.67, "learning_rate": 5.2951521668752206e-06, "loss": 1.2573, "step": 24396 }, { "epoch": 0.67, "learning_rate": 5.294371688960642e-06, "loss": 1.3486, "step": 24397 }, { "epoch": 0.67, "learning_rate": 5.2935912478606834e-06, "loss": 1.2417, "step": 24398 }, { "epoch": 0.67, "learning_rate": 5.292810843581462e-06, "loss": 1.2551, "step": 24399 }, { "epoch": 0.67, "learning_rate": 5.292030476129066e-06, "loss": 1.1797, "step": 24400 }, { "epoch": 0.67, "learning_rate": 5.291250145509615e-06, "loss": 1.2583, "step": 24401 }, { "epoch": 0.67, "learning_rate": 5.290469851729205e-06, "loss": 1.4009, "step": 24402 }, { "epoch": 0.67, "learning_rate": 5.289689594793951e-06, "loss": 1.3555, "step": 24403 }, { "epoch": 0.67, "learning_rate": 5.288909374709943e-06, "loss": 1.0012, "step": 24404 }, { "epoch": 0.67, "learning_rate": 5.288129191483297e-06, "loss": 1.1965, "step": 24405 }, { "epoch": 0.67, "learning_rate": 5.2873490451201085e-06, "loss": 1.2515, "step": 24406 }, { "epoch": 0.67, "learning_rate": 5.2865689356264884e-06, "loss": 1.217, "step": 24407 }, { "epoch": 0.67, "learning_rate": 5.285788863008537e-06, "loss": 1.3958, "step": 24408 }, { "epoch": 0.67, "learning_rate": 5.285008827272357e-06, "loss": 1.4092, "step": 24409 }, { "epoch": 0.67, "learning_rate": 5.284228828424046e-06, "loss": 1.2539, "step": 24410 }, { "epoch": 0.67, "learning_rate": 5.2834488664697155e-06, "loss": 1.1624, "step": 24411 }, { "epoch": 0.67, "learning_rate": 5.282668941415464e-06, "loss": 1.2388, "step": 24412 }, { "epoch": 0.67, "learning_rate": 5.281889053267388e-06, "loss": 1.3069, "step": 24413 }, { "epoch": 0.67, "learning_rate": 5.281109202031598e-06, "loss": 1.3196, "step": 24414 }, { "epoch": 0.67, "learning_rate": 5.2803293877141894e-06, "loss": 1.2976, "step": 24415 }, { "epoch": 0.67, "learning_rate": 5.279549610321264e-06, "loss": 1.2605, "step": 24416 }, { "epoch": 0.67, "learning_rate": 5.278769869858919e-06, "loss": 1.3481, "step": 24417 }, { "epoch": 0.67, "learning_rate": 5.2779901663332645e-06, "loss": 1.3123, "step": 24418 }, { "epoch": 0.67, "learning_rate": 5.2772104997503926e-06, "loss": 1.1528, "step": 24419 }, { "epoch": 0.67, "learning_rate": 5.276430870116405e-06, "loss": 1.24, "step": 24420 }, { "epoch": 0.67, "learning_rate": 5.275651277437398e-06, "loss": 1.2368, "step": 24421 }, { "epoch": 0.67, "learning_rate": 5.274871721719477e-06, "loss": 1.291, "step": 24422 }, { "epoch": 0.67, "learning_rate": 5.274092202968738e-06, "loss": 1.373, "step": 24423 }, { "epoch": 0.67, "learning_rate": 5.273312721191279e-06, "loss": 1.2446, "step": 24424 }, { "epoch": 0.67, "learning_rate": 5.272533276393196e-06, "loss": 1.1011, "step": 24425 }, { "epoch": 0.67, "learning_rate": 5.271753868580591e-06, "loss": 1.262, "step": 24426 }, { "epoch": 0.67, "learning_rate": 5.270974497759563e-06, "loss": 1.3784, "step": 24427 }, { "epoch": 0.67, "learning_rate": 5.270195163936203e-06, "loss": 1.2888, "step": 24428 }, { "epoch": 0.67, "learning_rate": 5.269415867116614e-06, "loss": 1.2708, "step": 24429 }, { "epoch": 0.67, "learning_rate": 5.268636607306892e-06, "loss": 1.2285, "step": 24430 }, { "epoch": 0.67, "learning_rate": 5.267857384513131e-06, "loss": 1.2327, "step": 24431 }, { "epoch": 0.67, "learning_rate": 5.2670781987414256e-06, "loss": 1.345, "step": 24432 }, { "epoch": 0.67, "learning_rate": 5.266299049997879e-06, "loss": 1.6392, "step": 24433 }, { "epoch": 0.67, "learning_rate": 5.2655199382885815e-06, "loss": 1.3699, "step": 24434 }, { "epoch": 0.67, "learning_rate": 5.26474086361963e-06, "loss": 1.4639, "step": 24435 }, { "epoch": 0.67, "learning_rate": 5.263961825997117e-06, "loss": 1.3438, "step": 24436 }, { "epoch": 0.67, "learning_rate": 5.263182825427142e-06, "loss": 1.1768, "step": 24437 }, { "epoch": 0.67, "learning_rate": 5.2624038619157935e-06, "loss": 1.1104, "step": 24438 }, { "epoch": 0.67, "learning_rate": 5.261624935469178e-06, "loss": 1.113, "step": 24439 }, { "epoch": 0.67, "learning_rate": 5.260846046093372e-06, "loss": 1.2566, "step": 24440 }, { "epoch": 0.67, "learning_rate": 5.260067193794483e-06, "loss": 0.9913, "step": 24441 }, { "epoch": 0.67, "learning_rate": 5.259288378578594e-06, "loss": 1.3213, "step": 24442 }, { "epoch": 0.67, "learning_rate": 5.258509600451809e-06, "loss": 1.3123, "step": 24443 }, { "epoch": 0.67, "learning_rate": 5.257730859420214e-06, "loss": 1.7134, "step": 24444 }, { "epoch": 0.67, "learning_rate": 5.256952155489901e-06, "loss": 1.2024, "step": 24445 }, { "epoch": 0.67, "learning_rate": 5.256173488666965e-06, "loss": 1.4602, "step": 24446 }, { "epoch": 0.67, "learning_rate": 5.255394858957499e-06, "loss": 1.7476, "step": 24447 }, { "epoch": 0.67, "learning_rate": 5.254616266367591e-06, "loss": 1.4226, "step": 24448 }, { "epoch": 0.67, "learning_rate": 5.253837710903331e-06, "loss": 1.229, "step": 24449 }, { "epoch": 0.67, "learning_rate": 5.253059192570817e-06, "loss": 1.2415, "step": 24450 }, { "epoch": 0.67, "learning_rate": 5.252280711376134e-06, "loss": 1.2319, "step": 24451 }, { "epoch": 0.67, "learning_rate": 5.251502267325377e-06, "loss": 1.3965, "step": 24452 }, { "epoch": 0.67, "learning_rate": 5.250723860424627e-06, "loss": 1.2053, "step": 24453 }, { "epoch": 0.67, "learning_rate": 5.249945490679986e-06, "loss": 1.3691, "step": 24454 }, { "epoch": 0.67, "learning_rate": 5.249167158097537e-06, "loss": 1.1531, "step": 24455 }, { "epoch": 0.67, "learning_rate": 5.24838886268337e-06, "loss": 1.3052, "step": 24456 }, { "epoch": 0.67, "learning_rate": 5.24761060444357e-06, "loss": 1.187, "step": 24457 }, { "epoch": 0.67, "learning_rate": 5.246832383384235e-06, "loss": 1.3665, "step": 24458 }, { "epoch": 0.67, "learning_rate": 5.246054199511448e-06, "loss": 1.3232, "step": 24459 }, { "epoch": 0.67, "learning_rate": 5.245276052831292e-06, "loss": 1.2153, "step": 24460 }, { "epoch": 0.67, "learning_rate": 5.244497943349866e-06, "loss": 1.3308, "step": 24461 }, { "epoch": 0.67, "learning_rate": 5.2437198710732515e-06, "loss": 1.2466, "step": 24462 }, { "epoch": 0.67, "learning_rate": 5.242941836007536e-06, "loss": 1.2107, "step": 24463 }, { "epoch": 0.67, "learning_rate": 5.2421638381588025e-06, "loss": 1.0769, "step": 24464 }, { "epoch": 0.67, "learning_rate": 5.241385877533145e-06, "loss": 1.0455, "step": 24465 }, { "epoch": 0.67, "learning_rate": 5.2406079541366486e-06, "loss": 1.7251, "step": 24466 }, { "epoch": 0.67, "learning_rate": 5.239830067975397e-06, "loss": 1.3706, "step": 24467 }, { "epoch": 0.67, "learning_rate": 5.239052219055471e-06, "loss": 1.1228, "step": 24468 }, { "epoch": 0.67, "learning_rate": 5.2382744073829685e-06, "loss": 1.3401, "step": 24469 }, { "epoch": 0.67, "learning_rate": 5.237496632963966e-06, "loss": 1.2532, "step": 24470 }, { "epoch": 0.67, "learning_rate": 5.23671889580455e-06, "loss": 1.165, "step": 24471 }, { "epoch": 0.67, "learning_rate": 5.235941195910803e-06, "loss": 1.2751, "step": 24472 }, { "epoch": 0.67, "learning_rate": 5.2351635332888095e-06, "loss": 1.4648, "step": 24473 }, { "epoch": 0.67, "learning_rate": 5.234385907944665e-06, "loss": 1.2446, "step": 24474 }, { "epoch": 0.67, "learning_rate": 5.2336083198844375e-06, "loss": 1.3774, "step": 24475 }, { "epoch": 0.67, "learning_rate": 5.232830769114221e-06, "loss": 1.1458, "step": 24476 }, { "epoch": 0.67, "learning_rate": 5.232053255640091e-06, "loss": 1.2859, "step": 24477 }, { "epoch": 0.67, "learning_rate": 5.231275779468141e-06, "loss": 1.3462, "step": 24478 }, { "epoch": 0.67, "learning_rate": 5.23049834060444e-06, "loss": 1.3369, "step": 24479 }, { "epoch": 0.67, "learning_rate": 5.22972093905508e-06, "loss": 1.2192, "step": 24480 }, { "epoch": 0.67, "learning_rate": 5.2289435748261366e-06, "loss": 1.2388, "step": 24481 }, { "epoch": 0.67, "learning_rate": 5.228166247923702e-06, "loss": 1.298, "step": 24482 }, { "epoch": 0.67, "learning_rate": 5.227388958353845e-06, "loss": 1.3809, "step": 24483 }, { "epoch": 0.67, "learning_rate": 5.226611706122656e-06, "loss": 1.3687, "step": 24484 }, { "epoch": 0.67, "learning_rate": 5.225834491236208e-06, "loss": 1.3865, "step": 24485 }, { "epoch": 0.67, "learning_rate": 5.225057313700594e-06, "loss": 1.3071, "step": 24486 }, { "epoch": 0.67, "learning_rate": 5.224280173521878e-06, "loss": 1.4565, "step": 24487 }, { "epoch": 0.67, "learning_rate": 5.223503070706153e-06, "loss": 1.2019, "step": 24488 }, { "epoch": 0.67, "learning_rate": 5.2227260052594904e-06, "loss": 1.168, "step": 24489 }, { "epoch": 0.67, "learning_rate": 5.221948977187976e-06, "loss": 1.2866, "step": 24490 }, { "epoch": 0.67, "learning_rate": 5.221171986497686e-06, "loss": 1.3479, "step": 24491 }, { "epoch": 0.67, "learning_rate": 5.2203950331946966e-06, "loss": 1.6768, "step": 24492 }, { "epoch": 0.67, "learning_rate": 5.2196181172850905e-06, "loss": 1.2319, "step": 24493 }, { "epoch": 0.67, "learning_rate": 5.218841238774945e-06, "loss": 1.3193, "step": 24494 }, { "epoch": 0.67, "learning_rate": 5.21806439767034e-06, "loss": 1.3757, "step": 24495 }, { "epoch": 0.67, "learning_rate": 5.217287593977344e-06, "loss": 1.3914, "step": 24496 }, { "epoch": 0.67, "learning_rate": 5.216510827702045e-06, "loss": 1.1377, "step": 24497 }, { "epoch": 0.67, "learning_rate": 5.215734098850516e-06, "loss": 1.2393, "step": 24498 }, { "epoch": 0.67, "learning_rate": 5.214957407428834e-06, "loss": 1.3892, "step": 24499 }, { "epoch": 0.67, "learning_rate": 5.214180753443072e-06, "loss": 1.2129, "step": 24500 }, { "epoch": 0.67, "learning_rate": 5.2134041368993115e-06, "loss": 1.4067, "step": 24501 }, { "epoch": 0.67, "learning_rate": 5.212627557803628e-06, "loss": 1.2722, "step": 24502 }, { "epoch": 0.67, "learning_rate": 5.211851016162095e-06, "loss": 1.144, "step": 24503 }, { "epoch": 0.67, "learning_rate": 5.211074511980782e-06, "loss": 1.6167, "step": 24504 }, { "epoch": 0.67, "learning_rate": 5.210298045265777e-06, "loss": 1.2793, "step": 24505 }, { "epoch": 0.67, "learning_rate": 5.209521616023146e-06, "loss": 1.1672, "step": 24506 }, { "epoch": 0.67, "learning_rate": 5.208745224258962e-06, "loss": 1.3098, "step": 24507 }, { "epoch": 0.67, "learning_rate": 5.207968869979308e-06, "loss": 1.2639, "step": 24508 }, { "epoch": 0.67, "learning_rate": 5.207192553190249e-06, "loss": 1.2388, "step": 24509 }, { "epoch": 0.67, "learning_rate": 5.206416273897863e-06, "loss": 1.437, "step": 24510 }, { "epoch": 0.67, "learning_rate": 5.205640032108218e-06, "loss": 1.2288, "step": 24511 }, { "epoch": 0.67, "learning_rate": 5.2048638278273954e-06, "loss": 1.272, "step": 24512 }, { "epoch": 0.67, "learning_rate": 5.204087661061463e-06, "loss": 1.0706, "step": 24513 }, { "epoch": 0.67, "learning_rate": 5.2033115318164926e-06, "loss": 1.1963, "step": 24514 }, { "epoch": 0.67, "learning_rate": 5.202535440098555e-06, "loss": 1.2195, "step": 24515 }, { "epoch": 0.67, "learning_rate": 5.201759385913727e-06, "loss": 1.3169, "step": 24516 }, { "epoch": 0.67, "learning_rate": 5.2009833692680774e-06, "loss": 1.2651, "step": 24517 }, { "epoch": 0.67, "learning_rate": 5.2002073901676775e-06, "loss": 1.5168, "step": 24518 }, { "epoch": 0.67, "learning_rate": 5.199431448618595e-06, "loss": 1.3096, "step": 24519 }, { "epoch": 0.67, "learning_rate": 5.198655544626901e-06, "loss": 1.2468, "step": 24520 }, { "epoch": 0.67, "learning_rate": 5.197879678198678e-06, "loss": 1.3406, "step": 24521 }, { "epoch": 0.67, "learning_rate": 5.197103849339978e-06, "loss": 1.2944, "step": 24522 }, { "epoch": 0.67, "learning_rate": 5.196328058056883e-06, "loss": 1.0984, "step": 24523 }, { "epoch": 0.67, "learning_rate": 5.1955523043554545e-06, "loss": 1.1042, "step": 24524 }, { "epoch": 0.67, "learning_rate": 5.194776588241774e-06, "loss": 1.2769, "step": 24525 }, { "epoch": 0.67, "learning_rate": 5.194000909721893e-06, "loss": 1.1973, "step": 24526 }, { "epoch": 0.67, "learning_rate": 5.193225268801894e-06, "loss": 1.4075, "step": 24527 }, { "epoch": 0.67, "learning_rate": 5.192449665487834e-06, "loss": 1.2415, "step": 24528 }, { "epoch": 0.67, "learning_rate": 5.1916740997857975e-06, "loss": 1.4038, "step": 24529 }, { "epoch": 0.67, "learning_rate": 5.190898571701833e-06, "loss": 1.2305, "step": 24530 }, { "epoch": 0.67, "learning_rate": 5.19012308124202e-06, "loss": 1.3647, "step": 24531 }, { "epoch": 0.67, "learning_rate": 5.189347628412419e-06, "loss": 1.3096, "step": 24532 }, { "epoch": 0.67, "learning_rate": 5.188572213219108e-06, "loss": 1.3962, "step": 24533 }, { "epoch": 0.67, "learning_rate": 5.187796835668137e-06, "loss": 1.1597, "step": 24534 }, { "epoch": 0.67, "learning_rate": 5.187021495765581e-06, "loss": 1.2678, "step": 24535 }, { "epoch": 0.67, "learning_rate": 5.18624619351751e-06, "loss": 1.2927, "step": 24536 }, { "epoch": 0.67, "learning_rate": 5.185470928929986e-06, "loss": 1.1589, "step": 24537 }, { "epoch": 0.67, "learning_rate": 5.18469570200907e-06, "loss": 1.2749, "step": 24538 }, { "epoch": 0.67, "learning_rate": 5.183920512760829e-06, "loss": 1.4255, "step": 24539 }, { "epoch": 0.67, "learning_rate": 5.183145361191334e-06, "loss": 1.2532, "step": 24540 }, { "epoch": 0.67, "learning_rate": 5.182370247306644e-06, "loss": 1.3145, "step": 24541 }, { "epoch": 0.67, "learning_rate": 5.181595171112823e-06, "loss": 1.1746, "step": 24542 }, { "epoch": 0.67, "learning_rate": 5.180820132615932e-06, "loss": 1.293, "step": 24543 }, { "epoch": 0.67, "learning_rate": 5.180045131822042e-06, "loss": 1.3496, "step": 24544 }, { "epoch": 0.67, "learning_rate": 5.179270168737214e-06, "loss": 1.3726, "step": 24545 }, { "epoch": 0.67, "learning_rate": 5.1784952433675075e-06, "loss": 1.2095, "step": 24546 }, { "epoch": 0.67, "learning_rate": 5.177720355718983e-06, "loss": 1.2209, "step": 24547 }, { "epoch": 0.67, "learning_rate": 5.1769455057977125e-06, "loss": 1.2456, "step": 24548 }, { "epoch": 0.67, "learning_rate": 5.17617069360975e-06, "loss": 1.2463, "step": 24549 }, { "epoch": 0.67, "learning_rate": 5.175395919161161e-06, "loss": 1.0463, "step": 24550 }, { "epoch": 0.67, "learning_rate": 5.174621182458002e-06, "loss": 1.2175, "step": 24551 }, { "epoch": 0.67, "learning_rate": 5.1738464835063415e-06, "loss": 1.5552, "step": 24552 }, { "epoch": 0.67, "learning_rate": 5.173071822312237e-06, "loss": 1.1902, "step": 24553 }, { "epoch": 0.67, "learning_rate": 5.172297198881744e-06, "loss": 1.2546, "step": 24554 }, { "epoch": 0.67, "learning_rate": 5.171522613220932e-06, "loss": 1.3096, "step": 24555 }, { "epoch": 0.67, "learning_rate": 5.170748065335856e-06, "loss": 1.3245, "step": 24556 }, { "epoch": 0.67, "learning_rate": 5.169973555232577e-06, "loss": 1.1938, "step": 24557 }, { "epoch": 0.67, "learning_rate": 5.169199082917149e-06, "loss": 1.3374, "step": 24558 }, { "epoch": 0.67, "learning_rate": 5.168424648395641e-06, "loss": 1.2202, "step": 24559 }, { "epoch": 0.67, "learning_rate": 5.167650251674106e-06, "loss": 1.4341, "step": 24560 }, { "epoch": 0.67, "learning_rate": 5.1668758927586025e-06, "loss": 1.2051, "step": 24561 }, { "epoch": 0.67, "learning_rate": 5.166101571655185e-06, "loss": 1.377, "step": 24562 }, { "epoch": 0.67, "learning_rate": 5.1653272883699215e-06, "loss": 1.1685, "step": 24563 }, { "epoch": 0.67, "learning_rate": 5.164553042908862e-06, "loss": 1.1514, "step": 24564 }, { "epoch": 0.67, "learning_rate": 5.163778835278066e-06, "loss": 1.2808, "step": 24565 }, { "epoch": 0.67, "learning_rate": 5.163004665483588e-06, "loss": 1.4414, "step": 24566 }, { "epoch": 0.67, "learning_rate": 5.162230533531485e-06, "loss": 1.3728, "step": 24567 }, { "epoch": 0.67, "learning_rate": 5.161456439427823e-06, "loss": 1.3484, "step": 24568 }, { "epoch": 0.67, "learning_rate": 5.160682383178646e-06, "loss": 1.2693, "step": 24569 }, { "epoch": 0.67, "learning_rate": 5.159908364790015e-06, "loss": 1.2915, "step": 24570 }, { "epoch": 0.67, "learning_rate": 5.159134384267982e-06, "loss": 1.3127, "step": 24571 }, { "epoch": 0.67, "learning_rate": 5.158360441618613e-06, "loss": 1.3081, "step": 24572 }, { "epoch": 0.67, "learning_rate": 5.157586536847948e-06, "loss": 1.2588, "step": 24573 }, { "epoch": 0.67, "learning_rate": 5.156812669962053e-06, "loss": 1.2996, "step": 24574 }, { "epoch": 0.67, "learning_rate": 5.1560388409669725e-06, "loss": 1.1436, "step": 24575 }, { "epoch": 0.67, "learning_rate": 5.1552650498687765e-06, "loss": 1.3667, "step": 24576 }, { "epoch": 0.67, "learning_rate": 5.1544912966735e-06, "loss": 1.2747, "step": 24577 }, { "epoch": 0.67, "learning_rate": 5.153717581387207e-06, "loss": 1.2747, "step": 24578 }, { "epoch": 0.67, "learning_rate": 5.152943904015948e-06, "loss": 1.1765, "step": 24579 }, { "epoch": 0.67, "learning_rate": 5.1521702645657825e-06, "loss": 1.3262, "step": 24580 }, { "epoch": 0.67, "learning_rate": 5.1513966630427495e-06, "loss": 1.4058, "step": 24581 }, { "epoch": 0.67, "learning_rate": 5.15062309945291e-06, "loss": 1.2473, "step": 24582 }, { "epoch": 0.67, "learning_rate": 5.149849573802319e-06, "loss": 1.3403, "step": 24583 }, { "epoch": 0.67, "learning_rate": 5.149076086097022e-06, "loss": 1.3647, "step": 24584 }, { "epoch": 0.67, "learning_rate": 5.148302636343075e-06, "loss": 1.3259, "step": 24585 }, { "epoch": 0.67, "learning_rate": 5.147529224546522e-06, "loss": 1.2849, "step": 24586 }, { "epoch": 0.67, "learning_rate": 5.146755850713423e-06, "loss": 1.2095, "step": 24587 }, { "epoch": 0.67, "learning_rate": 5.145982514849823e-06, "loss": 1.155, "step": 24588 }, { "epoch": 0.67, "learning_rate": 5.145209216961775e-06, "loss": 1.3794, "step": 24589 }, { "epoch": 0.67, "learning_rate": 5.1444359570553215e-06, "loss": 1.2209, "step": 24590 }, { "epoch": 0.67, "learning_rate": 5.1436627351365235e-06, "loss": 1.1836, "step": 24591 }, { "epoch": 0.67, "learning_rate": 5.142889551211423e-06, "loss": 1.3379, "step": 24592 }, { "epoch": 0.67, "learning_rate": 5.1421164052860705e-06, "loss": 1.3025, "step": 24593 }, { "epoch": 0.67, "learning_rate": 5.141343297366512e-06, "loss": 1.1804, "step": 24594 }, { "epoch": 0.67, "learning_rate": 5.140570227458803e-06, "loss": 1.3418, "step": 24595 }, { "epoch": 0.67, "learning_rate": 5.139797195568987e-06, "loss": 1.1545, "step": 24596 }, { "epoch": 0.67, "learning_rate": 5.139024201703108e-06, "loss": 1.3013, "step": 24597 }, { "epoch": 0.67, "learning_rate": 5.138251245867223e-06, "loss": 1.3091, "step": 24598 }, { "epoch": 0.67, "learning_rate": 5.137478328067373e-06, "loss": 1.0625, "step": 24599 }, { "epoch": 0.67, "learning_rate": 5.1367054483096055e-06, "loss": 1.2749, "step": 24600 }, { "epoch": 0.67, "learning_rate": 5.135932606599965e-06, "loss": 1.1381, "step": 24601 }, { "epoch": 0.67, "learning_rate": 5.135159802944504e-06, "loss": 1.334, "step": 24602 }, { "epoch": 0.67, "learning_rate": 5.1343870373492645e-06, "loss": 1.199, "step": 24603 }, { "epoch": 0.67, "learning_rate": 5.133614309820294e-06, "loss": 1.2732, "step": 24604 }, { "epoch": 0.67, "learning_rate": 5.132841620363632e-06, "loss": 1.342, "step": 24605 }, { "epoch": 0.67, "learning_rate": 5.132068968985333e-06, "loss": 1.1572, "step": 24606 }, { "epoch": 0.67, "learning_rate": 5.131296355691437e-06, "loss": 1.3621, "step": 24607 }, { "epoch": 0.67, "learning_rate": 5.130523780487989e-06, "loss": 1.6787, "step": 24608 }, { "epoch": 0.67, "learning_rate": 5.129751243381029e-06, "loss": 1.377, "step": 24609 }, { "epoch": 0.67, "learning_rate": 5.128978744376609e-06, "loss": 1.2383, "step": 24610 }, { "epoch": 0.67, "learning_rate": 5.12820628348077e-06, "loss": 1.2642, "step": 24611 }, { "epoch": 0.67, "learning_rate": 5.127433860699553e-06, "loss": 1.3643, "step": 24612 }, { "epoch": 0.67, "learning_rate": 5.126661476038999e-06, "loss": 1.3843, "step": 24613 }, { "epoch": 0.67, "learning_rate": 5.125889129505153e-06, "loss": 1.2097, "step": 24614 }, { "epoch": 0.67, "learning_rate": 5.125116821104066e-06, "loss": 1.4087, "step": 24615 }, { "epoch": 0.67, "learning_rate": 5.124344550841766e-06, "loss": 1.3479, "step": 24616 }, { "epoch": 0.67, "learning_rate": 5.123572318724306e-06, "loss": 1.199, "step": 24617 }, { "epoch": 0.67, "learning_rate": 5.122800124757718e-06, "loss": 1.323, "step": 24618 }, { "epoch": 0.67, "learning_rate": 5.122027968948055e-06, "loss": 1.3579, "step": 24619 }, { "epoch": 0.67, "learning_rate": 5.121255851301345e-06, "loss": 1.3574, "step": 24620 }, { "epoch": 0.67, "learning_rate": 5.12048377182364e-06, "loss": 1.3269, "step": 24621 }, { "epoch": 0.67, "learning_rate": 5.119711730520971e-06, "loss": 1.3325, "step": 24622 }, { "epoch": 0.67, "learning_rate": 5.1189397273993905e-06, "loss": 1.3904, "step": 24623 }, { "epoch": 0.67, "learning_rate": 5.11816776246492e-06, "loss": 1.2881, "step": 24624 }, { "epoch": 0.67, "learning_rate": 5.117395835723617e-06, "loss": 1.1975, "step": 24625 }, { "epoch": 0.67, "learning_rate": 5.116623947181507e-06, "loss": 1.4736, "step": 24626 }, { "epoch": 0.67, "learning_rate": 5.115852096844642e-06, "loss": 1.3267, "step": 24627 }, { "epoch": 0.67, "learning_rate": 5.1150802847190475e-06, "loss": 1.1282, "step": 24628 }, { "epoch": 0.67, "learning_rate": 5.114308510810768e-06, "loss": 1.2839, "step": 24629 }, { "epoch": 0.67, "learning_rate": 5.113536775125843e-06, "loss": 1.1057, "step": 24630 }, { "epoch": 0.67, "learning_rate": 5.1127650776703095e-06, "loss": 1.3867, "step": 24631 }, { "epoch": 0.67, "learning_rate": 5.111993418450205e-06, "loss": 1.3467, "step": 24632 }, { "epoch": 0.67, "learning_rate": 5.1112217974715615e-06, "loss": 1.1958, "step": 24633 }, { "epoch": 0.67, "learning_rate": 5.1104502147404225e-06, "loss": 1.3027, "step": 24634 }, { "epoch": 0.67, "learning_rate": 5.109678670262822e-06, "loss": 1.3452, "step": 24635 }, { "epoch": 0.67, "learning_rate": 5.108907164044797e-06, "loss": 1.3765, "step": 24636 }, { "epoch": 0.67, "learning_rate": 5.1081356960923776e-06, "loss": 1.7031, "step": 24637 }, { "epoch": 0.67, "learning_rate": 5.107364266411607e-06, "loss": 1.1677, "step": 24638 }, { "epoch": 0.67, "learning_rate": 5.10659287500852e-06, "loss": 1.3613, "step": 24639 }, { "epoch": 0.67, "learning_rate": 5.105821521889147e-06, "loss": 1.1946, "step": 24640 }, { "epoch": 0.67, "learning_rate": 5.1050502070595235e-06, "loss": 1.2109, "step": 24641 }, { "epoch": 0.67, "learning_rate": 5.104278930525688e-06, "loss": 1.3887, "step": 24642 }, { "epoch": 0.67, "learning_rate": 5.103507692293672e-06, "loss": 1.3315, "step": 24643 }, { "epoch": 0.67, "learning_rate": 5.1027364923695055e-06, "loss": 1.416, "step": 24644 }, { "epoch": 0.67, "learning_rate": 5.10196533075923e-06, "loss": 1.6733, "step": 24645 }, { "epoch": 0.67, "learning_rate": 5.101194207468874e-06, "loss": 1.197, "step": 24646 }, { "epoch": 0.67, "learning_rate": 5.100423122504472e-06, "loss": 1.1882, "step": 24647 }, { "epoch": 0.67, "learning_rate": 5.0996520758720505e-06, "loss": 1.2048, "step": 24648 }, { "epoch": 0.67, "learning_rate": 5.0988810675776515e-06, "loss": 1.1907, "step": 24649 }, { "epoch": 0.67, "learning_rate": 5.0981100976273025e-06, "loss": 1.2949, "step": 24650 }, { "epoch": 0.67, "learning_rate": 5.097339166027033e-06, "loss": 1.2212, "step": 24651 }, { "epoch": 0.67, "learning_rate": 5.096568272782876e-06, "loss": 1.3652, "step": 24652 }, { "epoch": 0.67, "learning_rate": 5.095797417900865e-06, "loss": 1.1335, "step": 24653 }, { "epoch": 0.67, "learning_rate": 5.095026601387028e-06, "loss": 1.1572, "step": 24654 }, { "epoch": 0.67, "learning_rate": 5.094255823247398e-06, "loss": 1.2085, "step": 24655 }, { "epoch": 0.67, "learning_rate": 5.093485083487999e-06, "loss": 1.2295, "step": 24656 }, { "epoch": 0.67, "learning_rate": 5.09271438211487e-06, "loss": 1.4065, "step": 24657 }, { "epoch": 0.67, "learning_rate": 5.0919437191340355e-06, "loss": 1.2354, "step": 24658 }, { "epoch": 0.67, "learning_rate": 5.0911730945515214e-06, "loss": 1.3235, "step": 24659 }, { "epoch": 0.67, "learning_rate": 5.090402508373364e-06, "loss": 1.2983, "step": 24660 }, { "epoch": 0.67, "learning_rate": 5.0896319606055865e-06, "loss": 1.3359, "step": 24661 }, { "epoch": 0.67, "learning_rate": 5.0888614512542265e-06, "loss": 1.2578, "step": 24662 }, { "epoch": 0.67, "learning_rate": 5.0880909803252974e-06, "loss": 1.271, "step": 24663 }, { "epoch": 0.67, "learning_rate": 5.087320547824839e-06, "loss": 1.2231, "step": 24664 }, { "epoch": 0.67, "learning_rate": 5.086550153758869e-06, "loss": 1.335, "step": 24665 }, { "epoch": 0.67, "learning_rate": 5.08577979813343e-06, "loss": 1.3137, "step": 24666 }, { "epoch": 0.67, "learning_rate": 5.08500948095453e-06, "loss": 1.2844, "step": 24667 }, { "epoch": 0.67, "learning_rate": 5.084239202228209e-06, "loss": 1.333, "step": 24668 }, { "epoch": 0.67, "learning_rate": 5.083468961960485e-06, "loss": 1.3318, "step": 24669 }, { "epoch": 0.67, "learning_rate": 5.082698760157392e-06, "loss": 1.335, "step": 24670 }, { "epoch": 0.67, "learning_rate": 5.081928596824951e-06, "loss": 1.1462, "step": 24671 }, { "epoch": 0.67, "learning_rate": 5.081158471969189e-06, "loss": 1.2573, "step": 24672 }, { "epoch": 0.67, "learning_rate": 5.080388385596124e-06, "loss": 1.4023, "step": 24673 }, { "epoch": 0.67, "learning_rate": 5.0796183377117935e-06, "loss": 1.3125, "step": 24674 }, { "epoch": 0.67, "learning_rate": 5.078848328322214e-06, "loss": 1.3203, "step": 24675 }, { "epoch": 0.67, "learning_rate": 5.078078357433408e-06, "loss": 1.2629, "step": 24676 }, { "epoch": 0.67, "learning_rate": 5.077308425051406e-06, "loss": 1.1113, "step": 24677 }, { "epoch": 0.67, "learning_rate": 5.076538531182228e-06, "loss": 1.251, "step": 24678 }, { "epoch": 0.67, "learning_rate": 5.075768675831897e-06, "loss": 1.3699, "step": 24679 }, { "epoch": 0.67, "learning_rate": 5.074998859006432e-06, "loss": 1.7295, "step": 24680 }, { "epoch": 0.67, "learning_rate": 5.074229080711865e-06, "loss": 1.2195, "step": 24681 }, { "epoch": 0.67, "learning_rate": 5.073459340954214e-06, "loss": 1.2861, "step": 24682 }, { "epoch": 0.67, "learning_rate": 5.072689639739499e-06, "loss": 1.1675, "step": 24683 }, { "epoch": 0.67, "learning_rate": 5.071919977073741e-06, "loss": 1.2275, "step": 24684 }, { "epoch": 0.67, "learning_rate": 5.071150352962966e-06, "loss": 1.2617, "step": 24685 }, { "epoch": 0.67, "learning_rate": 5.070380767413194e-06, "loss": 1.2466, "step": 24686 }, { "epoch": 0.67, "learning_rate": 5.069611220430444e-06, "loss": 1.2485, "step": 24687 }, { "epoch": 0.67, "learning_rate": 5.068841712020733e-06, "loss": 1.2117, "step": 24688 }, { "epoch": 0.67, "learning_rate": 5.068072242190091e-06, "loss": 1.2881, "step": 24689 }, { "epoch": 0.67, "learning_rate": 5.067302810944532e-06, "loss": 1.3647, "step": 24690 }, { "epoch": 0.67, "learning_rate": 5.066533418290072e-06, "loss": 1.283, "step": 24691 }, { "epoch": 0.67, "learning_rate": 5.065764064232739e-06, "loss": 1.1838, "step": 24692 }, { "epoch": 0.67, "learning_rate": 5.064994748778548e-06, "loss": 1.1594, "step": 24693 }, { "epoch": 0.67, "learning_rate": 5.064225471933517e-06, "loss": 1.2368, "step": 24694 }, { "epoch": 0.67, "learning_rate": 5.063456233703661e-06, "loss": 1.324, "step": 24695 }, { "epoch": 0.67, "learning_rate": 5.062687034095007e-06, "loss": 1.4321, "step": 24696 }, { "epoch": 0.67, "learning_rate": 5.0619178731135665e-06, "loss": 1.2266, "step": 24697 }, { "epoch": 0.67, "learning_rate": 5.061148750765359e-06, "loss": 1.3503, "step": 24698 }, { "epoch": 0.67, "learning_rate": 5.060379667056399e-06, "loss": 1.3477, "step": 24699 }, { "epoch": 0.67, "learning_rate": 5.0596106219927075e-06, "loss": 1.2827, "step": 24700 }, { "epoch": 0.67, "learning_rate": 5.058841615580295e-06, "loss": 1.4153, "step": 24701 }, { "epoch": 0.67, "learning_rate": 5.058072647825192e-06, "loss": 1.2422, "step": 24702 }, { "epoch": 0.67, "learning_rate": 5.057303718733395e-06, "loss": 1.1753, "step": 24703 }, { "epoch": 0.67, "learning_rate": 5.056534828310935e-06, "loss": 1.2542, "step": 24704 }, { "epoch": 0.67, "learning_rate": 5.0557659765638175e-06, "loss": 1.252, "step": 24705 }, { "epoch": 0.67, "learning_rate": 5.054997163498065e-06, "loss": 1.3333, "step": 24706 }, { "epoch": 0.67, "learning_rate": 5.054228389119691e-06, "loss": 1.2861, "step": 24707 }, { "epoch": 0.67, "learning_rate": 5.053459653434705e-06, "loss": 1.3101, "step": 24708 }, { "epoch": 0.67, "learning_rate": 5.052690956449126e-06, "loss": 1.1975, "step": 24709 }, { "epoch": 0.67, "learning_rate": 5.051922298168969e-06, "loss": 1.2727, "step": 24710 }, { "epoch": 0.67, "learning_rate": 5.051153678600244e-06, "loss": 1.3223, "step": 24711 }, { "epoch": 0.67, "learning_rate": 5.050385097748962e-06, "loss": 1.1487, "step": 24712 }, { "epoch": 0.67, "learning_rate": 5.049616555621142e-06, "loss": 1.332, "step": 24713 }, { "epoch": 0.67, "learning_rate": 5.048848052222797e-06, "loss": 1.2717, "step": 24714 }, { "epoch": 0.67, "learning_rate": 5.048079587559934e-06, "loss": 1.0581, "step": 24715 }, { "epoch": 0.67, "learning_rate": 5.047311161638565e-06, "loss": 1.2915, "step": 24716 }, { "epoch": 0.68, "learning_rate": 5.046542774464709e-06, "loss": 1.4521, "step": 24717 }, { "epoch": 0.68, "learning_rate": 5.045774426044372e-06, "loss": 1.1902, "step": 24718 }, { "epoch": 0.68, "learning_rate": 5.045006116383566e-06, "loss": 1.1611, "step": 24719 }, { "epoch": 0.68, "learning_rate": 5.044237845488299e-06, "loss": 1.4556, "step": 24720 }, { "epoch": 0.68, "learning_rate": 5.043469613364589e-06, "loss": 1.1362, "step": 24721 }, { "epoch": 0.68, "learning_rate": 5.042701420018441e-06, "loss": 1.1924, "step": 24722 }, { "epoch": 0.68, "learning_rate": 5.041933265455863e-06, "loss": 1.2236, "step": 24723 }, { "epoch": 0.68, "learning_rate": 5.041165149682872e-06, "loss": 1.3315, "step": 24724 }, { "epoch": 0.68, "learning_rate": 5.040397072705472e-06, "loss": 1.7109, "step": 24725 }, { "epoch": 0.68, "learning_rate": 5.039629034529673e-06, "loss": 1.3845, "step": 24726 }, { "epoch": 0.68, "learning_rate": 5.03886103516148e-06, "loss": 1.3362, "step": 24727 }, { "epoch": 0.68, "learning_rate": 5.03809307460691e-06, "loss": 1.2329, "step": 24728 }, { "epoch": 0.68, "learning_rate": 5.037325152871966e-06, "loss": 1.3821, "step": 24729 }, { "epoch": 0.68, "learning_rate": 5.036557269962656e-06, "loss": 1.3792, "step": 24730 }, { "epoch": 0.68, "learning_rate": 5.0357894258849845e-06, "loss": 1.2593, "step": 24731 }, { "epoch": 0.68, "learning_rate": 5.035021620644967e-06, "loss": 1.1167, "step": 24732 }, { "epoch": 0.68, "learning_rate": 5.034253854248605e-06, "loss": 1.4292, "step": 24733 }, { "epoch": 0.68, "learning_rate": 5.033486126701905e-06, "loss": 1.3237, "step": 24734 }, { "epoch": 0.68, "learning_rate": 5.032718438010872e-06, "loss": 1.356, "step": 24735 }, { "epoch": 0.68, "learning_rate": 5.031950788181517e-06, "loss": 1.3306, "step": 24736 }, { "epoch": 0.68, "learning_rate": 5.031183177219843e-06, "loss": 1.3572, "step": 24737 }, { "epoch": 0.68, "learning_rate": 5.030415605131851e-06, "loss": 1.2314, "step": 24738 }, { "epoch": 0.68, "learning_rate": 5.029648071923554e-06, "loss": 1.2444, "step": 24739 }, { "epoch": 0.68, "learning_rate": 5.028880577600951e-06, "loss": 1.1306, "step": 24740 }, { "epoch": 0.68, "learning_rate": 5.0281131221700556e-06, "loss": 1.3047, "step": 24741 }, { "epoch": 0.68, "learning_rate": 5.027345705636857e-06, "loss": 1.2764, "step": 24742 }, { "epoch": 0.68, "learning_rate": 5.026578328007372e-06, "loss": 1.2153, "step": 24743 }, { "epoch": 0.68, "learning_rate": 5.025810989287594e-06, "loss": 1.2429, "step": 24744 }, { "epoch": 0.68, "learning_rate": 5.025043689483542e-06, "loss": 1.1692, "step": 24745 }, { "epoch": 0.68, "learning_rate": 5.024276428601199e-06, "loss": 1.2114, "step": 24746 }, { "epoch": 0.68, "learning_rate": 5.023509206646582e-06, "loss": 1.2134, "step": 24747 }, { "epoch": 0.68, "learning_rate": 5.022742023625685e-06, "loss": 1.3115, "step": 24748 }, { "epoch": 0.68, "learning_rate": 5.021974879544522e-06, "loss": 1.3252, "step": 24749 }, { "epoch": 0.68, "learning_rate": 5.021207774409078e-06, "loss": 1.2693, "step": 24750 }, { "epoch": 0.68, "learning_rate": 5.020440708225369e-06, "loss": 1.2207, "step": 24751 }, { "epoch": 0.68, "learning_rate": 5.019673680999384e-06, "loss": 1.1028, "step": 24752 }, { "epoch": 0.68, "learning_rate": 5.018906692737135e-06, "loss": 1.2842, "step": 24753 }, { "epoch": 0.68, "learning_rate": 5.018139743444619e-06, "loss": 1.2095, "step": 24754 }, { "epoch": 0.68, "learning_rate": 5.0173728331278304e-06, "loss": 1.3535, "step": 24755 }, { "epoch": 0.68, "learning_rate": 5.016605961792777e-06, "loss": 1.2646, "step": 24756 }, { "epoch": 0.68, "learning_rate": 5.015839129445457e-06, "loss": 1.1836, "step": 24757 }, { "epoch": 0.68, "learning_rate": 5.015072336091866e-06, "loss": 1.2466, "step": 24758 }, { "epoch": 0.68, "learning_rate": 5.014305581738001e-06, "loss": 1.2632, "step": 24759 }, { "epoch": 0.68, "learning_rate": 5.013538866389869e-06, "loss": 1.2357, "step": 24760 }, { "epoch": 0.68, "learning_rate": 5.012772190053465e-06, "loss": 1.2137, "step": 24761 }, { "epoch": 0.68, "learning_rate": 5.012005552734785e-06, "loss": 1.1982, "step": 24762 }, { "epoch": 0.68, "learning_rate": 5.011238954439825e-06, "loss": 1.2495, "step": 24763 }, { "epoch": 0.68, "learning_rate": 5.010472395174589e-06, "loss": 1.0686, "step": 24764 }, { "epoch": 0.68, "learning_rate": 5.0097058749450715e-06, "loss": 1.2917, "step": 24765 }, { "epoch": 0.68, "learning_rate": 5.008939393757268e-06, "loss": 1.2328, "step": 24766 }, { "epoch": 0.68, "learning_rate": 5.0081729516171715e-06, "loss": 1.2607, "step": 24767 }, { "epoch": 0.68, "learning_rate": 5.0074065485307866e-06, "loss": 1.2112, "step": 24768 }, { "epoch": 0.68, "learning_rate": 5.0066401845041054e-06, "loss": 1.1929, "step": 24769 }, { "epoch": 0.68, "learning_rate": 5.00587385954312e-06, "loss": 1.2693, "step": 24770 }, { "epoch": 0.68, "learning_rate": 5.0051075736538315e-06, "loss": 1.2671, "step": 24771 }, { "epoch": 0.68, "learning_rate": 5.004341326842234e-06, "loss": 1.1855, "step": 24772 }, { "epoch": 0.68, "learning_rate": 5.00357511911432e-06, "loss": 1.311, "step": 24773 }, { "epoch": 0.68, "learning_rate": 5.002808950476081e-06, "loss": 1.3853, "step": 24774 }, { "epoch": 0.68, "learning_rate": 5.002042820933519e-06, "loss": 1.2539, "step": 24775 }, { "epoch": 0.68, "learning_rate": 5.001276730492623e-06, "loss": 1.2278, "step": 24776 }, { "epoch": 0.68, "learning_rate": 5.00051067915939e-06, "loss": 1.2751, "step": 24777 }, { "epoch": 0.68, "learning_rate": 4.999744666939804e-06, "loss": 1.3513, "step": 24778 }, { "epoch": 0.68, "learning_rate": 4.998978693839869e-06, "loss": 1.812, "step": 24779 }, { "epoch": 0.68, "learning_rate": 4.998212759865573e-06, "loss": 1.1567, "step": 24780 }, { "epoch": 0.68, "learning_rate": 4.997446865022909e-06, "loss": 1.4136, "step": 24781 }, { "epoch": 0.68, "learning_rate": 4.996681009317864e-06, "loss": 1.3896, "step": 24782 }, { "epoch": 0.68, "learning_rate": 4.995915192756434e-06, "loss": 1.2302, "step": 24783 }, { "epoch": 0.68, "learning_rate": 4.995149415344618e-06, "loss": 1.355, "step": 24784 }, { "epoch": 0.68, "learning_rate": 4.994383677088392e-06, "loss": 0.9481, "step": 24785 }, { "epoch": 0.68, "learning_rate": 4.993617977993758e-06, "loss": 1.3403, "step": 24786 }, { "epoch": 0.68, "learning_rate": 4.992852318066699e-06, "loss": 1.2185, "step": 24787 }, { "epoch": 0.68, "learning_rate": 4.992086697313216e-06, "loss": 1.3342, "step": 24788 }, { "epoch": 0.68, "learning_rate": 4.991321115739286e-06, "loss": 1.1963, "step": 24789 }, { "epoch": 0.68, "learning_rate": 4.990555573350907e-06, "loss": 1.3596, "step": 24790 }, { "epoch": 0.68, "learning_rate": 4.9897900701540616e-06, "loss": 1.2578, "step": 24791 }, { "epoch": 0.68, "learning_rate": 4.989024606154751e-06, "loss": 1.2803, "step": 24792 }, { "epoch": 0.68, "learning_rate": 4.9882591813589465e-06, "loss": 1.4316, "step": 24793 }, { "epoch": 0.68, "learning_rate": 4.987493795772651e-06, "loss": 1.2598, "step": 24794 }, { "epoch": 0.68, "learning_rate": 4.986728449401842e-06, "loss": 1.2261, "step": 24795 }, { "epoch": 0.68, "learning_rate": 4.98596314225252e-06, "loss": 1.2264, "step": 24796 }, { "epoch": 0.68, "learning_rate": 4.985197874330657e-06, "loss": 1.2993, "step": 24797 }, { "epoch": 0.68, "learning_rate": 4.984432645642252e-06, "loss": 1.1619, "step": 24798 }, { "epoch": 0.68, "learning_rate": 4.983667456193284e-06, "loss": 1.3877, "step": 24799 }, { "epoch": 0.68, "learning_rate": 4.9829023059897465e-06, "loss": 1.4058, "step": 24800 }, { "epoch": 0.68, "learning_rate": 4.9821371950376214e-06, "loss": 1.3474, "step": 24801 }, { "epoch": 0.68, "learning_rate": 4.9813721233428926e-06, "loss": 1.1614, "step": 24802 }, { "epoch": 0.68, "learning_rate": 4.980607090911551e-06, "loss": 1.3855, "step": 24803 }, { "epoch": 0.68, "learning_rate": 4.97984209774958e-06, "loss": 1.312, "step": 24804 }, { "epoch": 0.68, "learning_rate": 4.979077143862964e-06, "loss": 1.3577, "step": 24805 }, { "epoch": 0.68, "learning_rate": 4.978312229257682e-06, "loss": 1.2581, "step": 24806 }, { "epoch": 0.68, "learning_rate": 4.977547353939729e-06, "loss": 1.4158, "step": 24807 }, { "epoch": 0.68, "learning_rate": 4.976782517915084e-06, "loss": 1.2297, "step": 24808 }, { "epoch": 0.68, "learning_rate": 4.97601772118973e-06, "loss": 1.2605, "step": 24809 }, { "epoch": 0.68, "learning_rate": 4.9752529637696465e-06, "loss": 1.1587, "step": 24810 }, { "epoch": 0.68, "learning_rate": 4.9744882456608255e-06, "loss": 1.1323, "step": 24811 }, { "epoch": 0.68, "learning_rate": 4.973723566869246e-06, "loss": 1.2511, "step": 24812 }, { "epoch": 0.68, "learning_rate": 4.972958927400889e-06, "loss": 1.2634, "step": 24813 }, { "epoch": 0.68, "learning_rate": 4.972194327261733e-06, "loss": 1.196, "step": 24814 }, { "epoch": 0.68, "learning_rate": 4.971429766457769e-06, "loss": 1.3108, "step": 24815 }, { "epoch": 0.68, "learning_rate": 4.970665244994974e-06, "loss": 1.1255, "step": 24816 }, { "epoch": 0.68, "learning_rate": 4.969900762879325e-06, "loss": 1.3074, "step": 24817 }, { "epoch": 0.68, "learning_rate": 4.969136320116812e-06, "loss": 1.3833, "step": 24818 }, { "epoch": 0.68, "learning_rate": 4.968371916713409e-06, "loss": 1.2144, "step": 24819 }, { "epoch": 0.68, "learning_rate": 4.967607552675099e-06, "loss": 1.1653, "step": 24820 }, { "epoch": 0.68, "learning_rate": 4.966843228007857e-06, "loss": 1.1115, "step": 24821 }, { "epoch": 0.68, "learning_rate": 4.966078942717671e-06, "loss": 1.2825, "step": 24822 }, { "epoch": 0.68, "learning_rate": 4.965314696810516e-06, "loss": 1.209, "step": 24823 }, { "epoch": 0.68, "learning_rate": 4.964550490292372e-06, "loss": 1.2581, "step": 24824 }, { "epoch": 0.68, "learning_rate": 4.963786323169213e-06, "loss": 1.2495, "step": 24825 }, { "epoch": 0.68, "learning_rate": 4.963022195447025e-06, "loss": 1.1648, "step": 24826 }, { "epoch": 0.68, "learning_rate": 4.962258107131782e-06, "loss": 1.2764, "step": 24827 }, { "epoch": 0.68, "learning_rate": 4.961494058229465e-06, "loss": 1.1289, "step": 24828 }, { "epoch": 0.68, "learning_rate": 4.960730048746043e-06, "loss": 1.2024, "step": 24829 }, { "epoch": 0.68, "learning_rate": 4.9599660786875e-06, "loss": 1.7573, "step": 24830 }, { "epoch": 0.68, "learning_rate": 4.959202148059822e-06, "loss": 1.2197, "step": 24831 }, { "epoch": 0.68, "learning_rate": 4.958438256868966e-06, "loss": 1.3428, "step": 24832 }, { "epoch": 0.68, "learning_rate": 4.9576744051209235e-06, "loss": 1.3696, "step": 24833 }, { "epoch": 0.68, "learning_rate": 4.956910592821661e-06, "loss": 1.3667, "step": 24834 }, { "epoch": 0.68, "learning_rate": 4.956146819977166e-06, "loss": 1.2947, "step": 24835 }, { "epoch": 0.68, "learning_rate": 4.9553830865934e-06, "loss": 1.3289, "step": 24836 }, { "epoch": 0.68, "learning_rate": 4.954619392676347e-06, "loss": 1.2729, "step": 24837 }, { "epoch": 0.68, "learning_rate": 4.953855738231976e-06, "loss": 1.3499, "step": 24838 }, { "epoch": 0.68, "learning_rate": 4.953092123266273e-06, "loss": 1.4121, "step": 24839 }, { "epoch": 0.68, "learning_rate": 4.9523285477851965e-06, "loss": 1.2571, "step": 24840 }, { "epoch": 0.68, "learning_rate": 4.951565011794731e-06, "loss": 1.373, "step": 24841 }, { "epoch": 0.68, "learning_rate": 4.950801515300844e-06, "loss": 1.1033, "step": 24842 }, { "epoch": 0.68, "learning_rate": 4.9500380583095175e-06, "loss": 1.2776, "step": 24843 }, { "epoch": 0.68, "learning_rate": 4.949274640826712e-06, "loss": 1.7759, "step": 24844 }, { "epoch": 0.68, "learning_rate": 4.9485112628584075e-06, "loss": 1.7632, "step": 24845 }, { "epoch": 0.68, "learning_rate": 4.947747924410579e-06, "loss": 1.3325, "step": 24846 }, { "epoch": 0.68, "learning_rate": 4.946984625489194e-06, "loss": 1.3228, "step": 24847 }, { "epoch": 0.68, "learning_rate": 4.946221366100226e-06, "loss": 1.2358, "step": 24848 }, { "epoch": 0.68, "learning_rate": 4.945458146249641e-06, "loss": 1.3225, "step": 24849 }, { "epoch": 0.68, "learning_rate": 4.94469496594342e-06, "loss": 1.3987, "step": 24850 }, { "epoch": 0.68, "learning_rate": 4.943931825187527e-06, "loss": 1.3208, "step": 24851 }, { "epoch": 0.68, "learning_rate": 4.943168723987935e-06, "loss": 1.1697, "step": 24852 }, { "epoch": 0.68, "learning_rate": 4.942405662350608e-06, "loss": 1.3052, "step": 24853 }, { "epoch": 0.68, "learning_rate": 4.941642640281524e-06, "loss": 1.2268, "step": 24854 }, { "epoch": 0.68, "learning_rate": 4.940879657786651e-06, "loss": 1.2524, "step": 24855 }, { "epoch": 0.68, "learning_rate": 4.940116714871957e-06, "loss": 1.3254, "step": 24856 }, { "epoch": 0.68, "learning_rate": 4.939353811543405e-06, "loss": 1.1565, "step": 24857 }, { "epoch": 0.68, "learning_rate": 4.938590947806974e-06, "loss": 1.1729, "step": 24858 }, { "epoch": 0.68, "learning_rate": 4.937828123668627e-06, "loss": 1.1047, "step": 24859 }, { "epoch": 0.68, "learning_rate": 4.937065339134333e-06, "loss": 1.3181, "step": 24860 }, { "epoch": 0.68, "learning_rate": 4.936302594210054e-06, "loss": 1.2712, "step": 24861 }, { "epoch": 0.68, "learning_rate": 4.935539888901767e-06, "loss": 1.3, "step": 24862 }, { "epoch": 0.68, "learning_rate": 4.934777223215434e-06, "loss": 1.3079, "step": 24863 }, { "epoch": 0.68, "learning_rate": 4.934014597157019e-06, "loss": 1.3711, "step": 24864 }, { "epoch": 0.68, "learning_rate": 4.933252010732495e-06, "loss": 1.4873, "step": 24865 }, { "epoch": 0.68, "learning_rate": 4.932489463947825e-06, "loss": 1.2446, "step": 24866 }, { "epoch": 0.68, "learning_rate": 4.931726956808975e-06, "loss": 1.269, "step": 24867 }, { "epoch": 0.68, "learning_rate": 4.930964489321904e-06, "loss": 1.3508, "step": 24868 }, { "epoch": 0.68, "learning_rate": 4.930202061492588e-06, "loss": 1.2917, "step": 24869 }, { "epoch": 0.68, "learning_rate": 4.929439673326989e-06, "loss": 1.2208, "step": 24870 }, { "epoch": 0.68, "learning_rate": 4.928677324831068e-06, "loss": 1.1521, "step": 24871 }, { "epoch": 0.68, "learning_rate": 4.927915016010787e-06, "loss": 1.3855, "step": 24872 }, { "epoch": 0.68, "learning_rate": 4.927152746872118e-06, "loss": 1.2258, "step": 24873 }, { "epoch": 0.68, "learning_rate": 4.9263905174210205e-06, "loss": 1.3054, "step": 24874 }, { "epoch": 0.68, "learning_rate": 4.925628327663458e-06, "loss": 1.217, "step": 24875 }, { "epoch": 0.68, "learning_rate": 4.924866177605389e-06, "loss": 1.0928, "step": 24876 }, { "epoch": 0.68, "learning_rate": 4.9241040672527805e-06, "loss": 1.3921, "step": 24877 }, { "epoch": 0.68, "learning_rate": 4.923341996611604e-06, "loss": 1.2468, "step": 24878 }, { "epoch": 0.68, "learning_rate": 4.922579965687804e-06, "loss": 1.4004, "step": 24879 }, { "epoch": 0.68, "learning_rate": 4.921817974487354e-06, "loss": 1.6357, "step": 24880 }, { "epoch": 0.68, "learning_rate": 4.921056023016208e-06, "loss": 1.2466, "step": 24881 }, { "epoch": 0.68, "learning_rate": 4.9202941112803404e-06, "loss": 1.2632, "step": 24882 }, { "epoch": 0.68, "learning_rate": 4.919532239285695e-06, "loss": 1.2588, "step": 24883 }, { "epoch": 0.68, "learning_rate": 4.918770407038244e-06, "loss": 1.3628, "step": 24884 }, { "epoch": 0.68, "learning_rate": 4.9180086145439394e-06, "loss": 1.4302, "step": 24885 }, { "epoch": 0.68, "learning_rate": 4.9172468618087544e-06, "loss": 1.3823, "step": 24886 }, { "epoch": 0.68, "learning_rate": 4.916485148838632e-06, "loss": 1.2212, "step": 24887 }, { "epoch": 0.68, "learning_rate": 4.915723475639544e-06, "loss": 1.345, "step": 24888 }, { "epoch": 0.68, "learning_rate": 4.914961842217439e-06, "loss": 1.2056, "step": 24889 }, { "epoch": 0.68, "learning_rate": 4.91420024857829e-06, "loss": 1.2671, "step": 24890 }, { "epoch": 0.68, "learning_rate": 4.913438694728039e-06, "loss": 1.186, "step": 24891 }, { "epoch": 0.68, "learning_rate": 4.912677180672653e-06, "loss": 1.2485, "step": 24892 }, { "epoch": 0.68, "learning_rate": 4.91191570641809e-06, "loss": 1.3057, "step": 24893 }, { "epoch": 0.68, "learning_rate": 4.911154271970308e-06, "loss": 1.3423, "step": 24894 }, { "epoch": 0.68, "learning_rate": 4.910392877335261e-06, "loss": 1.0255, "step": 24895 }, { "epoch": 0.68, "learning_rate": 4.909631522518903e-06, "loss": 1.2944, "step": 24896 }, { "epoch": 0.68, "learning_rate": 4.908870207527199e-06, "loss": 1.1157, "step": 24897 }, { "epoch": 0.68, "learning_rate": 4.908108932366099e-06, "loss": 1.644, "step": 24898 }, { "epoch": 0.68, "learning_rate": 4.9073476970415615e-06, "loss": 1.3972, "step": 24899 }, { "epoch": 0.68, "learning_rate": 4.906586501559537e-06, "loss": 1.1709, "step": 24900 }, { "epoch": 0.68, "learning_rate": 4.905825345925988e-06, "loss": 1.1604, "step": 24901 }, { "epoch": 0.68, "learning_rate": 4.905064230146865e-06, "loss": 1.2961, "step": 24902 }, { "epoch": 0.68, "learning_rate": 4.904303154228126e-06, "loss": 1.3503, "step": 24903 }, { "epoch": 0.68, "learning_rate": 4.903542118175718e-06, "loss": 1.7842, "step": 24904 }, { "epoch": 0.68, "learning_rate": 4.902781121995604e-06, "loss": 1.1902, "step": 24905 }, { "epoch": 0.68, "learning_rate": 4.902020165693733e-06, "loss": 1.3208, "step": 24906 }, { "epoch": 0.68, "learning_rate": 4.9012592492760555e-06, "loss": 1.2219, "step": 24907 }, { "epoch": 0.68, "learning_rate": 4.900498372748532e-06, "loss": 1.3044, "step": 24908 }, { "epoch": 0.68, "learning_rate": 4.8997375361171104e-06, "loss": 1.5659, "step": 24909 }, { "epoch": 0.68, "learning_rate": 4.898976739387745e-06, "loss": 1.3276, "step": 24910 }, { "epoch": 0.68, "learning_rate": 4.8982159825663835e-06, "loss": 1.2234, "step": 24911 }, { "epoch": 0.68, "learning_rate": 4.897455265658985e-06, "loss": 1.3357, "step": 24912 }, { "epoch": 0.68, "learning_rate": 4.896694588671496e-06, "loss": 1.3792, "step": 24913 }, { "epoch": 0.68, "learning_rate": 4.895933951609869e-06, "loss": 1.3225, "step": 24914 }, { "epoch": 0.68, "learning_rate": 4.895173354480051e-06, "loss": 1.3135, "step": 24915 }, { "epoch": 0.68, "learning_rate": 4.8944127972879995e-06, "loss": 1.2263, "step": 24916 }, { "epoch": 0.68, "learning_rate": 4.893652280039662e-06, "loss": 1.2839, "step": 24917 }, { "epoch": 0.68, "learning_rate": 4.8928918027409886e-06, "loss": 1.2817, "step": 24918 }, { "epoch": 0.68, "learning_rate": 4.8921313653979245e-06, "loss": 1.2256, "step": 24919 }, { "epoch": 0.68, "learning_rate": 4.891370968016425e-06, "loss": 1.3745, "step": 24920 }, { "epoch": 0.68, "learning_rate": 4.890610610602437e-06, "loss": 1.3359, "step": 24921 }, { "epoch": 0.68, "learning_rate": 4.889850293161911e-06, "loss": 1.2285, "step": 24922 }, { "epoch": 0.68, "learning_rate": 4.889090015700787e-06, "loss": 1.2385, "step": 24923 }, { "epoch": 0.68, "learning_rate": 4.888329778225021e-06, "loss": 1.1829, "step": 24924 }, { "epoch": 0.68, "learning_rate": 4.887569580740567e-06, "loss": 1.3069, "step": 24925 }, { "epoch": 0.68, "learning_rate": 4.886809423253355e-06, "loss": 1.248, "step": 24926 }, { "epoch": 0.68, "learning_rate": 4.886049305769347e-06, "loss": 1.3269, "step": 24927 }, { "epoch": 0.68, "learning_rate": 4.885289228294481e-06, "loss": 1.4077, "step": 24928 }, { "epoch": 0.68, "learning_rate": 4.8845291908347135e-06, "loss": 1.3926, "step": 24929 }, { "epoch": 0.68, "learning_rate": 4.883769193395976e-06, "loss": 1.3044, "step": 24930 }, { "epoch": 0.68, "learning_rate": 4.883009235984229e-06, "loss": 1.3271, "step": 24931 }, { "epoch": 0.68, "learning_rate": 4.882249318605406e-06, "loss": 1.2605, "step": 24932 }, { "epoch": 0.68, "learning_rate": 4.881489441265461e-06, "loss": 1.282, "step": 24933 }, { "epoch": 0.68, "learning_rate": 4.880729603970335e-06, "loss": 1.2798, "step": 24934 }, { "epoch": 0.68, "learning_rate": 4.879969806725976e-06, "loss": 1.1819, "step": 24935 }, { "epoch": 0.68, "learning_rate": 4.87921004953832e-06, "loss": 1.3198, "step": 24936 }, { "epoch": 0.68, "learning_rate": 4.878450332413321e-06, "loss": 1.3113, "step": 24937 }, { "epoch": 0.68, "learning_rate": 4.877690655356918e-06, "loss": 1.1469, "step": 24938 }, { "epoch": 0.68, "learning_rate": 4.876931018375052e-06, "loss": 1.2234, "step": 24939 }, { "epoch": 0.68, "learning_rate": 4.876171421473671e-06, "loss": 1.2957, "step": 24940 }, { "epoch": 0.68, "learning_rate": 4.875411864658715e-06, "loss": 1.2493, "step": 24941 }, { "epoch": 0.68, "learning_rate": 4.874652347936128e-06, "loss": 1.2322, "step": 24942 }, { "epoch": 0.68, "learning_rate": 4.873892871311847e-06, "loss": 1.2944, "step": 24943 }, { "epoch": 0.68, "learning_rate": 4.873133434791822e-06, "loss": 1.2939, "step": 24944 }, { "epoch": 0.68, "learning_rate": 4.872374038381989e-06, "loss": 1.7637, "step": 24945 }, { "epoch": 0.68, "learning_rate": 4.871614682088291e-06, "loss": 1.3225, "step": 24946 }, { "epoch": 0.68, "learning_rate": 4.870855365916665e-06, "loss": 1.0996, "step": 24947 }, { "epoch": 0.68, "learning_rate": 4.870096089873058e-06, "loss": 1.1934, "step": 24948 }, { "epoch": 0.68, "learning_rate": 4.869336853963407e-06, "loss": 1.2573, "step": 24949 }, { "epoch": 0.68, "learning_rate": 4.868577658193651e-06, "loss": 1.4036, "step": 24950 }, { "epoch": 0.68, "learning_rate": 4.867818502569727e-06, "loss": 1.3579, "step": 24951 }, { "epoch": 0.68, "learning_rate": 4.867059387097582e-06, "loss": 1.3506, "step": 24952 }, { "epoch": 0.68, "learning_rate": 4.866300311783151e-06, "loss": 1.228, "step": 24953 }, { "epoch": 0.68, "learning_rate": 4.865541276632367e-06, "loss": 1.3904, "step": 24954 }, { "epoch": 0.68, "learning_rate": 4.8647822816511794e-06, "loss": 1.3223, "step": 24955 }, { "epoch": 0.68, "learning_rate": 4.864023326845518e-06, "loss": 1.3542, "step": 24956 }, { "epoch": 0.68, "learning_rate": 4.863264412221326e-06, "loss": 1.3352, "step": 24957 }, { "epoch": 0.68, "learning_rate": 4.862505537784532e-06, "loss": 1.3516, "step": 24958 }, { "epoch": 0.68, "learning_rate": 4.861746703541082e-06, "loss": 1.3589, "step": 24959 }, { "epoch": 0.68, "learning_rate": 4.860987909496912e-06, "loss": 1.2966, "step": 24960 }, { "epoch": 0.68, "learning_rate": 4.860229155657954e-06, "loss": 1.4417, "step": 24961 }, { "epoch": 0.68, "learning_rate": 4.859470442030144e-06, "loss": 1.1558, "step": 24962 }, { "epoch": 0.68, "learning_rate": 4.8587117686194226e-06, "loss": 1.259, "step": 24963 }, { "epoch": 0.68, "learning_rate": 4.857953135431723e-06, "loss": 1.4058, "step": 24964 }, { "epoch": 0.68, "learning_rate": 4.85719454247298e-06, "loss": 1.2874, "step": 24965 }, { "epoch": 0.68, "learning_rate": 4.856435989749125e-06, "loss": 1.2095, "step": 24966 }, { "epoch": 0.68, "learning_rate": 4.855677477266101e-06, "loss": 1.2825, "step": 24967 }, { "epoch": 0.68, "learning_rate": 4.854919005029833e-06, "loss": 1.1985, "step": 24968 }, { "epoch": 0.68, "learning_rate": 4.854160573046262e-06, "loss": 1.3293, "step": 24969 }, { "epoch": 0.68, "learning_rate": 4.8534021813213196e-06, "loss": 1.355, "step": 24970 }, { "epoch": 0.68, "learning_rate": 4.852643829860935e-06, "loss": 1.2339, "step": 24971 }, { "epoch": 0.68, "learning_rate": 4.851885518671047e-06, "loss": 1.3062, "step": 24972 }, { "epoch": 0.68, "learning_rate": 4.851127247757587e-06, "loss": 1.438, "step": 24973 }, { "epoch": 0.68, "learning_rate": 4.8503690171264865e-06, "loss": 1.2542, "step": 24974 }, { "epoch": 0.68, "learning_rate": 4.8496108267836726e-06, "loss": 1.3423, "step": 24975 }, { "epoch": 0.68, "learning_rate": 4.848852676735087e-06, "loss": 1.2649, "step": 24976 }, { "epoch": 0.68, "learning_rate": 4.848094566986654e-06, "loss": 1.2881, "step": 24977 }, { "epoch": 0.68, "learning_rate": 4.847336497544308e-06, "loss": 1.2363, "step": 24978 }, { "epoch": 0.68, "learning_rate": 4.8465784684139735e-06, "loss": 1.3464, "step": 24979 }, { "epoch": 0.68, "learning_rate": 4.84582047960159e-06, "loss": 1.2742, "step": 24980 }, { "epoch": 0.68, "learning_rate": 4.845062531113084e-06, "loss": 1.356, "step": 24981 }, { "epoch": 0.68, "learning_rate": 4.844304622954383e-06, "loss": 1.1677, "step": 24982 }, { "epoch": 0.68, "learning_rate": 4.843546755131416e-06, "loss": 1.1992, "step": 24983 }, { "epoch": 0.68, "learning_rate": 4.842788927650118e-06, "loss": 1.2688, "step": 24984 }, { "epoch": 0.68, "learning_rate": 4.842031140516414e-06, "loss": 1.2017, "step": 24985 }, { "epoch": 0.68, "learning_rate": 4.841273393736229e-06, "loss": 1.1997, "step": 24986 }, { "epoch": 0.68, "learning_rate": 4.840515687315499e-06, "loss": 1.2761, "step": 24987 }, { "epoch": 0.68, "learning_rate": 4.839758021260149e-06, "loss": 1.4492, "step": 24988 }, { "epoch": 0.68, "learning_rate": 4.839000395576105e-06, "loss": 1.3457, "step": 24989 }, { "epoch": 0.68, "learning_rate": 4.838242810269291e-06, "loss": 1.2893, "step": 24990 }, { "epoch": 0.68, "learning_rate": 4.837485265345642e-06, "loss": 1.2009, "step": 24991 }, { "epoch": 0.68, "learning_rate": 4.836727760811081e-06, "loss": 1.4199, "step": 24992 }, { "epoch": 0.68, "learning_rate": 4.835970296671533e-06, "loss": 1.1018, "step": 24993 }, { "epoch": 0.68, "learning_rate": 4.835212872932923e-06, "loss": 1.2415, "step": 24994 }, { "epoch": 0.68, "learning_rate": 4.834455489601182e-06, "loss": 1.2678, "step": 24995 }, { "epoch": 0.68, "learning_rate": 4.8336981466822315e-06, "loss": 1.3723, "step": 24996 }, { "epoch": 0.68, "learning_rate": 4.832940844181998e-06, "loss": 1.3245, "step": 24997 }, { "epoch": 0.68, "learning_rate": 4.832183582106401e-06, "loss": 1.2209, "step": 24998 }, { "epoch": 0.68, "learning_rate": 4.8314263604613745e-06, "loss": 1.7109, "step": 24999 }, { "epoch": 0.68, "learning_rate": 4.830669179252837e-06, "loss": 1.3687, "step": 25000 }, { "epoch": 0.68, "learning_rate": 4.829912038486709e-06, "loss": 1.3792, "step": 25001 }, { "epoch": 0.68, "learning_rate": 4.829154938168923e-06, "loss": 1.2573, "step": 25002 }, { "epoch": 0.68, "learning_rate": 4.828397878305393e-06, "loss": 1.2073, "step": 25003 }, { "epoch": 0.68, "learning_rate": 4.8276408589020544e-06, "loss": 1.1326, "step": 25004 }, { "epoch": 0.68, "learning_rate": 4.826883879964812e-06, "loss": 1.3616, "step": 25005 }, { "epoch": 0.68, "learning_rate": 4.8261269414996025e-06, "loss": 1.2588, "step": 25006 }, { "epoch": 0.68, "learning_rate": 4.82537004351234e-06, "loss": 1.2656, "step": 25007 }, { "epoch": 0.68, "learning_rate": 4.824613186008955e-06, "loss": 1.3101, "step": 25008 }, { "epoch": 0.68, "learning_rate": 4.823856368995356e-06, "loss": 1.2844, "step": 25009 }, { "epoch": 0.68, "learning_rate": 4.823099592477474e-06, "loss": 1.3342, "step": 25010 }, { "epoch": 0.68, "learning_rate": 4.822342856461223e-06, "loss": 1.2864, "step": 25011 }, { "epoch": 0.68, "learning_rate": 4.821586160952534e-06, "loss": 1.3914, "step": 25012 }, { "epoch": 0.68, "learning_rate": 4.820829505957313e-06, "loss": 1.2212, "step": 25013 }, { "epoch": 0.68, "learning_rate": 4.82007289148149e-06, "loss": 1.2532, "step": 25014 }, { "epoch": 0.68, "learning_rate": 4.8193163175309765e-06, "loss": 1.3765, "step": 25015 }, { "epoch": 0.68, "learning_rate": 4.8185597841117005e-06, "loss": 1.772, "step": 25016 }, { "epoch": 0.68, "learning_rate": 4.817803291229577e-06, "loss": 1.772, "step": 25017 }, { "epoch": 0.68, "learning_rate": 4.817046838890519e-06, "loss": 1.1736, "step": 25018 }, { "epoch": 0.68, "learning_rate": 4.816290427100453e-06, "loss": 1.3044, "step": 25019 }, { "epoch": 0.68, "learning_rate": 4.815534055865293e-06, "loss": 1.1392, "step": 25020 }, { "epoch": 0.68, "learning_rate": 4.814777725190956e-06, "loss": 1.2632, "step": 25021 }, { "epoch": 0.68, "learning_rate": 4.814021435083358e-06, "loss": 1.4392, "step": 25022 }, { "epoch": 0.68, "learning_rate": 4.81326518554842e-06, "loss": 1.2009, "step": 25023 }, { "epoch": 0.68, "learning_rate": 4.812508976592057e-06, "loss": 1.1768, "step": 25024 }, { "epoch": 0.68, "learning_rate": 4.811752808220185e-06, "loss": 1.3506, "step": 25025 }, { "epoch": 0.68, "learning_rate": 4.810996680438714e-06, "loss": 1.3247, "step": 25026 }, { "epoch": 0.68, "learning_rate": 4.810240593253569e-06, "loss": 1.2527, "step": 25027 }, { "epoch": 0.68, "learning_rate": 4.809484546670662e-06, "loss": 1.23, "step": 25028 }, { "epoch": 0.68, "learning_rate": 4.808728540695906e-06, "loss": 1.2603, "step": 25029 }, { "epoch": 0.68, "learning_rate": 4.807972575335215e-06, "loss": 1.3098, "step": 25030 }, { "epoch": 0.68, "learning_rate": 4.807216650594507e-06, "loss": 1.2412, "step": 25031 }, { "epoch": 0.68, "learning_rate": 4.806460766479695e-06, "loss": 1.2593, "step": 25032 }, { "epoch": 0.68, "learning_rate": 4.805704922996688e-06, "loss": 1.2783, "step": 25033 }, { "epoch": 0.68, "learning_rate": 4.804949120151406e-06, "loss": 1.2324, "step": 25034 }, { "epoch": 0.68, "learning_rate": 4.80419335794976e-06, "loss": 1.4133, "step": 25035 }, { "epoch": 0.68, "learning_rate": 4.803437636397662e-06, "loss": 1.1655, "step": 25036 }, { "epoch": 0.68, "learning_rate": 4.8026819555010205e-06, "loss": 1.269, "step": 25037 }, { "epoch": 0.68, "learning_rate": 4.8019263152657545e-06, "loss": 1.3325, "step": 25038 }, { "epoch": 0.68, "learning_rate": 4.8011707156977735e-06, "loss": 1.1758, "step": 25039 }, { "epoch": 0.68, "learning_rate": 4.800415156802987e-06, "loss": 1.2778, "step": 25040 }, { "epoch": 0.68, "learning_rate": 4.799659638587305e-06, "loss": 1.2898, "step": 25041 }, { "epoch": 0.68, "learning_rate": 4.7989041610566446e-06, "loss": 1.3728, "step": 25042 }, { "epoch": 0.68, "learning_rate": 4.798148724216911e-06, "loss": 1.2522, "step": 25043 }, { "epoch": 0.68, "learning_rate": 4.797393328074017e-06, "loss": 1.2585, "step": 25044 }, { "epoch": 0.68, "learning_rate": 4.796637972633866e-06, "loss": 1.4424, "step": 25045 }, { "epoch": 0.68, "learning_rate": 4.7958826579023774e-06, "loss": 1.3757, "step": 25046 }, { "epoch": 0.68, "learning_rate": 4.795127383885455e-06, "loss": 1.3264, "step": 25047 }, { "epoch": 0.68, "learning_rate": 4.794372150589005e-06, "loss": 1.214, "step": 25048 }, { "epoch": 0.68, "learning_rate": 4.793616958018944e-06, "loss": 1.3403, "step": 25049 }, { "epoch": 0.68, "learning_rate": 4.792861806181172e-06, "loss": 1.3169, "step": 25050 }, { "epoch": 0.68, "learning_rate": 4.792106695081606e-06, "loss": 1.1338, "step": 25051 }, { "epoch": 0.68, "learning_rate": 4.791351624726143e-06, "loss": 1.2853, "step": 25052 }, { "epoch": 0.68, "learning_rate": 4.790596595120699e-06, "loss": 1.3855, "step": 25053 }, { "epoch": 0.68, "learning_rate": 4.789841606271173e-06, "loss": 1.4111, "step": 25054 }, { "epoch": 0.68, "learning_rate": 4.7890866581834835e-06, "loss": 1.1746, "step": 25055 }, { "epoch": 0.68, "learning_rate": 4.788331750863524e-06, "loss": 1.2058, "step": 25056 }, { "epoch": 0.68, "learning_rate": 4.787576884317209e-06, "loss": 1.3386, "step": 25057 }, { "epoch": 0.68, "learning_rate": 4.7868220585504366e-06, "loss": 1.1873, "step": 25058 }, { "epoch": 0.68, "learning_rate": 4.786067273569126e-06, "loss": 1.366, "step": 25059 }, { "epoch": 0.68, "learning_rate": 4.785312529379165e-06, "loss": 1.3662, "step": 25060 }, { "epoch": 0.68, "learning_rate": 4.78455782598647e-06, "loss": 1.2634, "step": 25061 }, { "epoch": 0.68, "learning_rate": 4.7838031633969395e-06, "loss": 1.4062, "step": 25062 }, { "epoch": 0.68, "learning_rate": 4.783048541616483e-06, "loss": 1.113, "step": 25063 }, { "epoch": 0.68, "learning_rate": 4.7822939606510025e-06, "loss": 1.2058, "step": 25064 }, { "epoch": 0.68, "learning_rate": 4.781539420506396e-06, "loss": 1.3652, "step": 25065 }, { "epoch": 0.68, "learning_rate": 4.780784921188575e-06, "loss": 1.3181, "step": 25066 }, { "epoch": 0.68, "learning_rate": 4.7800304627034386e-06, "loss": 1.2661, "step": 25067 }, { "epoch": 0.68, "learning_rate": 4.77927604505689e-06, "loss": 1.2087, "step": 25068 }, { "epoch": 0.68, "learning_rate": 4.778521668254825e-06, "loss": 1.3464, "step": 25069 }, { "epoch": 0.68, "learning_rate": 4.777767332303157e-06, "loss": 1.2893, "step": 25070 }, { "epoch": 0.68, "learning_rate": 4.7770130372077805e-06, "loss": 1.1926, "step": 25071 }, { "epoch": 0.68, "learning_rate": 4.776258782974599e-06, "loss": 1.2949, "step": 25072 }, { "epoch": 0.68, "learning_rate": 4.775504569609507e-06, "loss": 1.3035, "step": 25073 }, { "epoch": 0.68, "learning_rate": 4.774750397118416e-06, "loss": 1.2795, "step": 25074 }, { "epoch": 0.68, "learning_rate": 4.77399626550722e-06, "loss": 1.4443, "step": 25075 }, { "epoch": 0.68, "learning_rate": 4.773242174781819e-06, "loss": 1.3525, "step": 25076 }, { "epoch": 0.68, "learning_rate": 4.772488124948111e-06, "loss": 1.3247, "step": 25077 }, { "epoch": 0.68, "learning_rate": 4.771734116012001e-06, "loss": 1.3206, "step": 25078 }, { "epoch": 0.68, "learning_rate": 4.770980147979385e-06, "loss": 1.2412, "step": 25079 }, { "epoch": 0.68, "learning_rate": 4.7702262208561575e-06, "loss": 1.3118, "step": 25080 }, { "epoch": 0.68, "learning_rate": 4.769472334648224e-06, "loss": 1.0675, "step": 25081 }, { "epoch": 0.68, "learning_rate": 4.76871848936148e-06, "loss": 1.3721, "step": 25082 }, { "epoch": 0.69, "learning_rate": 4.767964685001823e-06, "loss": 1.0837, "step": 25083 }, { "epoch": 0.69, "learning_rate": 4.767210921575146e-06, "loss": 1.0332, "step": 25084 }, { "epoch": 0.69, "learning_rate": 4.766457199087354e-06, "loss": 1.3169, "step": 25085 }, { "epoch": 0.69, "learning_rate": 4.76570351754434e-06, "loss": 1.4622, "step": 25086 }, { "epoch": 0.69, "learning_rate": 4.764949876952e-06, "loss": 1.3484, "step": 25087 }, { "epoch": 0.69, "learning_rate": 4.764196277316226e-06, "loss": 1.1746, "step": 25088 }, { "epoch": 0.69, "learning_rate": 4.763442718642924e-06, "loss": 1.3574, "step": 25089 }, { "epoch": 0.69, "learning_rate": 4.762689200937981e-06, "loss": 1.2585, "step": 25090 }, { "epoch": 0.69, "learning_rate": 4.7619357242072974e-06, "loss": 1.2437, "step": 25091 }, { "epoch": 0.69, "learning_rate": 4.76118228845676e-06, "loss": 1.1937, "step": 25092 }, { "epoch": 0.69, "learning_rate": 4.760428893692274e-06, "loss": 1.2515, "step": 25093 }, { "epoch": 0.69, "learning_rate": 4.759675539919728e-06, "loss": 1.1846, "step": 25094 }, { "epoch": 0.69, "learning_rate": 4.7589222271450134e-06, "loss": 1.3235, "step": 25095 }, { "epoch": 0.69, "learning_rate": 4.758168955374029e-06, "loss": 1.0994, "step": 25096 }, { "epoch": 0.69, "learning_rate": 4.757415724612663e-06, "loss": 1.3079, "step": 25097 }, { "epoch": 0.69, "learning_rate": 4.756662534866818e-06, "loss": 1.2947, "step": 25098 }, { "epoch": 0.69, "learning_rate": 4.755909386142373e-06, "loss": 1.2292, "step": 25099 }, { "epoch": 0.69, "learning_rate": 4.755156278445231e-06, "loss": 1.3687, "step": 25100 }, { "epoch": 0.69, "learning_rate": 4.754403211781276e-06, "loss": 1.25, "step": 25101 }, { "epoch": 0.69, "learning_rate": 4.75365018615641e-06, "loss": 1.208, "step": 25102 }, { "epoch": 0.69, "learning_rate": 4.752897201576512e-06, "loss": 1.2969, "step": 25103 }, { "epoch": 0.69, "learning_rate": 4.752144258047482e-06, "loss": 1.3105, "step": 25104 }, { "epoch": 0.69, "learning_rate": 4.751391355575203e-06, "loss": 1.4856, "step": 25105 }, { "epoch": 0.69, "learning_rate": 4.750638494165579e-06, "loss": 1.3464, "step": 25106 }, { "epoch": 0.69, "learning_rate": 4.7498856738244824e-06, "loss": 1.1797, "step": 25107 }, { "epoch": 0.69, "learning_rate": 4.749132894557816e-06, "loss": 1.1782, "step": 25108 }, { "epoch": 0.69, "learning_rate": 4.74838015637146e-06, "loss": 1.3552, "step": 25109 }, { "epoch": 0.69, "learning_rate": 4.747627459271314e-06, "loss": 1.1692, "step": 25110 }, { "epoch": 0.69, "learning_rate": 4.746874803263258e-06, "loss": 1.3638, "step": 25111 }, { "epoch": 0.69, "learning_rate": 4.746122188353182e-06, "loss": 1.408, "step": 25112 }, { "epoch": 0.69, "learning_rate": 4.745369614546977e-06, "loss": 1.2922, "step": 25113 }, { "epoch": 0.69, "learning_rate": 4.744617081850531e-06, "loss": 1.3464, "step": 25114 }, { "epoch": 0.69, "learning_rate": 4.743864590269729e-06, "loss": 1.2473, "step": 25115 }, { "epoch": 0.69, "learning_rate": 4.743112139810455e-06, "loss": 1.2747, "step": 25116 }, { "epoch": 0.69, "learning_rate": 4.742359730478604e-06, "loss": 1.291, "step": 25117 }, { "epoch": 0.69, "learning_rate": 4.741607362280059e-06, "loss": 1.3103, "step": 25118 }, { "epoch": 0.69, "learning_rate": 4.740855035220704e-06, "loss": 1.2686, "step": 25119 }, { "epoch": 0.69, "learning_rate": 4.740102749306422e-06, "loss": 1.2063, "step": 25120 }, { "epoch": 0.69, "learning_rate": 4.7393505045431064e-06, "loss": 1.4009, "step": 25121 }, { "epoch": 0.69, "learning_rate": 4.73859830093664e-06, "loss": 1.3501, "step": 25122 }, { "epoch": 0.69, "learning_rate": 4.7378461384929055e-06, "loss": 1.3916, "step": 25123 }, { "epoch": 0.69, "learning_rate": 4.737094017217785e-06, "loss": 1.2449, "step": 25124 }, { "epoch": 0.69, "learning_rate": 4.736341937117171e-06, "loss": 1.2402, "step": 25125 }, { "epoch": 0.69, "learning_rate": 4.735589898196941e-06, "loss": 1.7578, "step": 25126 }, { "epoch": 0.69, "learning_rate": 4.734837900462976e-06, "loss": 1.3054, "step": 25127 }, { "epoch": 0.69, "learning_rate": 4.7340859439211675e-06, "loss": 1.2156, "step": 25128 }, { "epoch": 0.69, "learning_rate": 4.7333340285773955e-06, "loss": 1.0906, "step": 25129 }, { "epoch": 0.69, "learning_rate": 4.7325821544375404e-06, "loss": 1.3535, "step": 25130 }, { "epoch": 0.69, "learning_rate": 4.731830321507482e-06, "loss": 1.2571, "step": 25131 }, { "epoch": 0.69, "learning_rate": 4.73107852979311e-06, "loss": 1.3184, "step": 25132 }, { "epoch": 0.69, "learning_rate": 4.730326779300301e-06, "loss": 1.333, "step": 25133 }, { "epoch": 0.69, "learning_rate": 4.729575070034938e-06, "loss": 1.2258, "step": 25134 }, { "epoch": 0.69, "learning_rate": 4.728823402002899e-06, "loss": 1.2847, "step": 25135 }, { "epoch": 0.69, "learning_rate": 4.728071775210069e-06, "loss": 1.1594, "step": 25136 }, { "epoch": 0.69, "learning_rate": 4.727320189662326e-06, "loss": 1.1576, "step": 25137 }, { "epoch": 0.69, "learning_rate": 4.726568645365553e-06, "loss": 1.4541, "step": 25138 }, { "epoch": 0.69, "learning_rate": 4.725817142325621e-06, "loss": 1.449, "step": 25139 }, { "epoch": 0.69, "learning_rate": 4.7250656805484165e-06, "loss": 1.2878, "step": 25140 }, { "epoch": 0.69, "learning_rate": 4.7243142600398235e-06, "loss": 1.2393, "step": 25141 }, { "epoch": 0.69, "learning_rate": 4.72356288080571e-06, "loss": 1.2908, "step": 25142 }, { "epoch": 0.69, "learning_rate": 4.7228115428519615e-06, "loss": 1.3169, "step": 25143 }, { "epoch": 0.69, "learning_rate": 4.722060246184451e-06, "loss": 1.1875, "step": 25144 }, { "epoch": 0.69, "learning_rate": 4.721308990809067e-06, "loss": 1.2788, "step": 25145 }, { "epoch": 0.69, "learning_rate": 4.720557776731672e-06, "loss": 1.2517, "step": 25146 }, { "epoch": 0.69, "learning_rate": 4.719806603958152e-06, "loss": 1.271, "step": 25147 }, { "epoch": 0.69, "learning_rate": 4.719055472494381e-06, "loss": 1.354, "step": 25148 }, { "epoch": 0.69, "learning_rate": 4.718304382346243e-06, "loss": 1.2898, "step": 25149 }, { "epoch": 0.69, "learning_rate": 4.7175533335196e-06, "loss": 1.4065, "step": 25150 }, { "epoch": 0.69, "learning_rate": 4.71680232602034e-06, "loss": 1.1995, "step": 25151 }, { "epoch": 0.69, "learning_rate": 4.71605135985433e-06, "loss": 1.2463, "step": 25152 }, { "epoch": 0.69, "learning_rate": 4.715300435027458e-06, "loss": 1.1953, "step": 25153 }, { "epoch": 0.69, "learning_rate": 4.714549551545582e-06, "loss": 1.2766, "step": 25154 }, { "epoch": 0.69, "learning_rate": 4.713798709414589e-06, "loss": 1.1365, "step": 25155 }, { "epoch": 0.69, "learning_rate": 4.713047908640344e-06, "loss": 1.2864, "step": 25156 }, { "epoch": 0.69, "learning_rate": 4.712297149228731e-06, "loss": 1.3269, "step": 25157 }, { "epoch": 0.69, "learning_rate": 4.71154643118562e-06, "loss": 1.3037, "step": 25158 }, { "epoch": 0.69, "learning_rate": 4.7107957545168785e-06, "loss": 1.3228, "step": 25159 }, { "epoch": 0.69, "learning_rate": 4.710045119228387e-06, "loss": 1.1255, "step": 25160 }, { "epoch": 0.69, "learning_rate": 4.709294525326015e-06, "loss": 1.7158, "step": 25161 }, { "epoch": 0.69, "learning_rate": 4.708543972815635e-06, "loss": 1.2749, "step": 25162 }, { "epoch": 0.69, "learning_rate": 4.707793461703114e-06, "loss": 1.2422, "step": 25163 }, { "epoch": 0.69, "learning_rate": 4.707042991994333e-06, "loss": 1.2751, "step": 25164 }, { "epoch": 0.69, "learning_rate": 4.706292563695159e-06, "loss": 1.4111, "step": 25165 }, { "epoch": 0.69, "learning_rate": 4.7055421768114616e-06, "loss": 1.0938, "step": 25166 }, { "epoch": 0.69, "learning_rate": 4.7047918313491105e-06, "loss": 1.2678, "step": 25167 }, { "epoch": 0.69, "learning_rate": 4.7040415273139805e-06, "loss": 1.2439, "step": 25168 }, { "epoch": 0.69, "learning_rate": 4.70329126471194e-06, "loss": 1.2581, "step": 25169 }, { "epoch": 0.69, "learning_rate": 4.702541043548857e-06, "loss": 1.1299, "step": 25170 }, { "epoch": 0.69, "learning_rate": 4.7017908638306e-06, "loss": 1.1758, "step": 25171 }, { "epoch": 0.69, "learning_rate": 4.701040725563042e-06, "loss": 1.2861, "step": 25172 }, { "epoch": 0.69, "learning_rate": 4.70029062875205e-06, "loss": 1.3359, "step": 25173 }, { "epoch": 0.69, "learning_rate": 4.6995405734034886e-06, "loss": 1.1506, "step": 25174 }, { "epoch": 0.69, "learning_rate": 4.698790559523232e-06, "loss": 1.219, "step": 25175 }, { "epoch": 0.69, "learning_rate": 4.698040587117146e-06, "loss": 1.1812, "step": 25176 }, { "epoch": 0.69, "learning_rate": 4.697290656191098e-06, "loss": 1.213, "step": 25177 }, { "epoch": 0.69, "learning_rate": 4.69654076675095e-06, "loss": 1.2119, "step": 25178 }, { "epoch": 0.69, "learning_rate": 4.695790918802577e-06, "loss": 1.2371, "step": 25179 }, { "epoch": 0.69, "learning_rate": 4.695041112351841e-06, "loss": 1.2612, "step": 25180 }, { "epoch": 0.69, "learning_rate": 4.694291347404609e-06, "loss": 1.4385, "step": 25181 }, { "epoch": 0.69, "learning_rate": 4.693541623966743e-06, "loss": 1.3599, "step": 25182 }, { "epoch": 0.69, "learning_rate": 4.692791942044116e-06, "loss": 1.2051, "step": 25183 }, { "epoch": 0.69, "learning_rate": 4.69204230164259e-06, "loss": 1.3586, "step": 25184 }, { "epoch": 0.69, "learning_rate": 4.691292702768028e-06, "loss": 1.3032, "step": 25185 }, { "epoch": 0.69, "learning_rate": 4.690543145426292e-06, "loss": 1.2437, "step": 25186 }, { "epoch": 0.69, "learning_rate": 4.6897936296232494e-06, "loss": 1.2886, "step": 25187 }, { "epoch": 0.69, "learning_rate": 4.689044155364773e-06, "loss": 1.241, "step": 25188 }, { "epoch": 0.69, "learning_rate": 4.688294722656709e-06, "loss": 1.2671, "step": 25189 }, { "epoch": 0.69, "learning_rate": 4.687545331504934e-06, "loss": 1.2104, "step": 25190 }, { "epoch": 0.69, "learning_rate": 4.686795981915301e-06, "loss": 1.025, "step": 25191 }, { "epoch": 0.69, "learning_rate": 4.6860466738936874e-06, "loss": 1.2893, "step": 25192 }, { "epoch": 0.69, "learning_rate": 4.685297407445937e-06, "loss": 1.2812, "step": 25193 }, { "epoch": 0.69, "learning_rate": 4.684548182577924e-06, "loss": 1.2681, "step": 25194 }, { "epoch": 0.69, "learning_rate": 4.683798999295504e-06, "loss": 1.2151, "step": 25195 }, { "epoch": 0.69, "learning_rate": 4.683049857604543e-06, "loss": 1.0913, "step": 25196 }, { "epoch": 0.69, "learning_rate": 4.682300757510902e-06, "loss": 1.1062, "step": 25197 }, { "epoch": 0.69, "learning_rate": 4.681551699020437e-06, "loss": 1.3208, "step": 25198 }, { "epoch": 0.69, "learning_rate": 4.680802682139008e-06, "loss": 1.2595, "step": 25199 }, { "epoch": 0.69, "learning_rate": 4.68005370687248e-06, "loss": 1.3079, "step": 25200 }, { "epoch": 0.69, "learning_rate": 4.679304773226711e-06, "loss": 1.4124, "step": 25201 }, { "epoch": 0.69, "learning_rate": 4.678555881207557e-06, "loss": 1.4409, "step": 25202 }, { "epoch": 0.69, "learning_rate": 4.677807030820882e-06, "loss": 1.1968, "step": 25203 }, { "epoch": 0.69, "learning_rate": 4.677058222072542e-06, "loss": 1.2864, "step": 25204 }, { "epoch": 0.69, "learning_rate": 4.676309454968396e-06, "loss": 1.1589, "step": 25205 }, { "epoch": 0.69, "learning_rate": 4.675560729514298e-06, "loss": 1.2551, "step": 25206 }, { "epoch": 0.69, "learning_rate": 4.674812045716111e-06, "loss": 1.3628, "step": 25207 }, { "epoch": 0.69, "learning_rate": 4.674063403579693e-06, "loss": 1.3064, "step": 25208 }, { "epoch": 0.69, "learning_rate": 4.673314803110898e-06, "loss": 1.3418, "step": 25209 }, { "epoch": 0.69, "learning_rate": 4.672566244315578e-06, "loss": 1.2148, "step": 25210 }, { "epoch": 0.69, "learning_rate": 4.6718177271995994e-06, "loss": 1.2756, "step": 25211 }, { "epoch": 0.69, "learning_rate": 4.671069251768812e-06, "loss": 1.2185, "step": 25212 }, { "epoch": 0.69, "learning_rate": 4.670320818029075e-06, "loss": 1.7197, "step": 25213 }, { "epoch": 0.69, "learning_rate": 4.669572425986237e-06, "loss": 1.396, "step": 25214 }, { "epoch": 0.69, "learning_rate": 4.668824075646161e-06, "loss": 1.2747, "step": 25215 }, { "epoch": 0.69, "learning_rate": 4.6680757670146995e-06, "loss": 1.176, "step": 25216 }, { "epoch": 0.69, "learning_rate": 4.667327500097706e-06, "loss": 1.2415, "step": 25217 }, { "epoch": 0.69, "learning_rate": 4.66657927490103e-06, "loss": 1.2305, "step": 25218 }, { "epoch": 0.69, "learning_rate": 4.665831091430534e-06, "loss": 1.3606, "step": 25219 }, { "epoch": 0.69, "learning_rate": 4.665082949692067e-06, "loss": 1.1777, "step": 25220 }, { "epoch": 0.69, "learning_rate": 4.664334849691479e-06, "loss": 1.1816, "step": 25221 }, { "epoch": 0.69, "learning_rate": 4.663586791434629e-06, "loss": 1.2073, "step": 25222 }, { "epoch": 0.69, "learning_rate": 4.662838774927367e-06, "loss": 1.2646, "step": 25223 }, { "epoch": 0.69, "learning_rate": 4.662090800175545e-06, "loss": 1.2456, "step": 25224 }, { "epoch": 0.69, "learning_rate": 4.661342867185011e-06, "loss": 1.2061, "step": 25225 }, { "epoch": 0.69, "learning_rate": 4.660594975961623e-06, "loss": 1.3748, "step": 25226 }, { "epoch": 0.69, "learning_rate": 4.65984712651123e-06, "loss": 1.115, "step": 25227 }, { "epoch": 0.69, "learning_rate": 4.659099318839682e-06, "loss": 1.3533, "step": 25228 }, { "epoch": 0.69, "learning_rate": 4.6583515529528246e-06, "loss": 1.3201, "step": 25229 }, { "epoch": 0.69, "learning_rate": 4.657603828856517e-06, "loss": 1.2261, "step": 25230 }, { "epoch": 0.69, "learning_rate": 4.656856146556602e-06, "loss": 1.1785, "step": 25231 }, { "epoch": 0.69, "learning_rate": 4.656108506058939e-06, "loss": 1.2358, "step": 25232 }, { "epoch": 0.69, "learning_rate": 4.6553609073693615e-06, "loss": 1.2603, "step": 25233 }, { "epoch": 0.69, "learning_rate": 4.6546133504937285e-06, "loss": 1.2542, "step": 25234 }, { "epoch": 0.69, "learning_rate": 4.653865835437891e-06, "loss": 1.2568, "step": 25235 }, { "epoch": 0.69, "learning_rate": 4.653118362207692e-06, "loss": 1.313, "step": 25236 }, { "epoch": 0.69, "learning_rate": 4.652370930808982e-06, "loss": 1.3076, "step": 25237 }, { "epoch": 0.69, "learning_rate": 4.6516235412476015e-06, "loss": 1.1777, "step": 25238 }, { "epoch": 0.69, "learning_rate": 4.650876193529409e-06, "loss": 1.1685, "step": 25239 }, { "epoch": 0.69, "learning_rate": 4.650128887660246e-06, "loss": 1.3179, "step": 25240 }, { "epoch": 0.69, "learning_rate": 4.649381623645957e-06, "loss": 1.231, "step": 25241 }, { "epoch": 0.69, "learning_rate": 4.6486344014923875e-06, "loss": 1.2502, "step": 25242 }, { "epoch": 0.69, "learning_rate": 4.64788722120539e-06, "loss": 1.2632, "step": 25243 }, { "epoch": 0.69, "learning_rate": 4.647140082790806e-06, "loss": 1.199, "step": 25244 }, { "epoch": 0.69, "learning_rate": 4.646392986254481e-06, "loss": 1.2329, "step": 25245 }, { "epoch": 0.69, "learning_rate": 4.645645931602256e-06, "loss": 1.2048, "step": 25246 }, { "epoch": 0.69, "learning_rate": 4.644898918839983e-06, "loss": 1.2229, "step": 25247 }, { "epoch": 0.69, "learning_rate": 4.644151947973503e-06, "loss": 1.4331, "step": 25248 }, { "epoch": 0.69, "learning_rate": 4.643405019008656e-06, "loss": 1.2268, "step": 25249 }, { "epoch": 0.69, "learning_rate": 4.642658131951293e-06, "loss": 1.178, "step": 25250 }, { "epoch": 0.69, "learning_rate": 4.641911286807252e-06, "loss": 1.2942, "step": 25251 }, { "epoch": 0.69, "learning_rate": 4.64116448358238e-06, "loss": 1.175, "step": 25252 }, { "epoch": 0.69, "learning_rate": 4.640417722282512e-06, "loss": 1.249, "step": 25253 }, { "epoch": 0.69, "learning_rate": 4.639671002913499e-06, "loss": 1.1304, "step": 25254 }, { "epoch": 0.69, "learning_rate": 4.638924325481181e-06, "loss": 1.6553, "step": 25255 }, { "epoch": 0.69, "learning_rate": 4.638177689991397e-06, "loss": 1.2202, "step": 25256 }, { "epoch": 0.69, "learning_rate": 4.637431096449985e-06, "loss": 0.96, "step": 25257 }, { "epoch": 0.69, "learning_rate": 4.636684544862796e-06, "loss": 1.2998, "step": 25258 }, { "epoch": 0.69, "learning_rate": 4.635938035235664e-06, "loss": 1.376, "step": 25259 }, { "epoch": 0.69, "learning_rate": 4.635191567574431e-06, "loss": 1.3044, "step": 25260 }, { "epoch": 0.69, "learning_rate": 4.634445141884932e-06, "loss": 1.2053, "step": 25261 }, { "epoch": 0.69, "learning_rate": 4.633698758173015e-06, "loss": 1.3196, "step": 25262 }, { "epoch": 0.69, "learning_rate": 4.632952416444516e-06, "loss": 1.2068, "step": 25263 }, { "epoch": 0.69, "learning_rate": 4.63220611670527e-06, "loss": 1.2957, "step": 25264 }, { "epoch": 0.69, "learning_rate": 4.631459858961123e-06, "loss": 1.3496, "step": 25265 }, { "epoch": 0.69, "learning_rate": 4.630713643217904e-06, "loss": 1.2349, "step": 25266 }, { "epoch": 0.69, "learning_rate": 4.6299674694814656e-06, "loss": 1.1804, "step": 25267 }, { "epoch": 0.69, "learning_rate": 4.629221337757629e-06, "loss": 1.2485, "step": 25268 }, { "epoch": 0.69, "learning_rate": 4.628475248052243e-06, "loss": 1.2622, "step": 25269 }, { "epoch": 0.69, "learning_rate": 4.6277292003711374e-06, "loss": 1.3511, "step": 25270 }, { "epoch": 0.69, "learning_rate": 4.626983194720159e-06, "loss": 1.2527, "step": 25271 }, { "epoch": 0.69, "learning_rate": 4.62623723110513e-06, "loss": 1.1497, "step": 25272 }, { "epoch": 0.69, "learning_rate": 4.625491309531899e-06, "loss": 1.3984, "step": 25273 }, { "epoch": 0.69, "learning_rate": 4.624745430006291e-06, "loss": 1.3525, "step": 25274 }, { "epoch": 0.69, "learning_rate": 4.623999592534156e-06, "loss": 1.1226, "step": 25275 }, { "epoch": 0.69, "learning_rate": 4.623253797121312e-06, "loss": 1.2961, "step": 25276 }, { "epoch": 0.69, "learning_rate": 4.622508043773607e-06, "loss": 1.1917, "step": 25277 }, { "epoch": 0.69, "learning_rate": 4.621762332496865e-06, "loss": 1.4407, "step": 25278 }, { "epoch": 0.69, "learning_rate": 4.6210166632969345e-06, "loss": 1.269, "step": 25279 }, { "epoch": 0.69, "learning_rate": 4.620271036179631e-06, "loss": 1.3447, "step": 25280 }, { "epoch": 0.69, "learning_rate": 4.619525451150798e-06, "loss": 1.3489, "step": 25281 }, { "epoch": 0.69, "learning_rate": 4.618779908216272e-06, "loss": 1.2083, "step": 25282 }, { "epoch": 0.69, "learning_rate": 4.618034407381882e-06, "loss": 1.2751, "step": 25283 }, { "epoch": 0.69, "learning_rate": 4.617288948653459e-06, "loss": 1.2703, "step": 25284 }, { "epoch": 0.69, "learning_rate": 4.616543532036832e-06, "loss": 1.1467, "step": 25285 }, { "epoch": 0.69, "learning_rate": 4.615798157537842e-06, "loss": 1.1714, "step": 25286 }, { "epoch": 0.69, "learning_rate": 4.615052825162315e-06, "loss": 1.3005, "step": 25287 }, { "epoch": 0.69, "learning_rate": 4.614307534916082e-06, "loss": 1.7197, "step": 25288 }, { "epoch": 0.69, "learning_rate": 4.61356228680497e-06, "loss": 1.2874, "step": 25289 }, { "epoch": 0.69, "learning_rate": 4.612817080834819e-06, "loss": 1.259, "step": 25290 }, { "epoch": 0.69, "learning_rate": 4.6120719170114535e-06, "loss": 1.4878, "step": 25291 }, { "epoch": 0.69, "learning_rate": 4.611326795340704e-06, "loss": 1.3052, "step": 25292 }, { "epoch": 0.69, "learning_rate": 4.610581715828395e-06, "loss": 1.313, "step": 25293 }, { "epoch": 0.69, "learning_rate": 4.609836678480364e-06, "loss": 1.2151, "step": 25294 }, { "epoch": 0.69, "learning_rate": 4.6090916833024366e-06, "loss": 1.3289, "step": 25295 }, { "epoch": 0.69, "learning_rate": 4.608346730300438e-06, "loss": 1.4053, "step": 25296 }, { "epoch": 0.69, "learning_rate": 4.607601819480202e-06, "loss": 1.1543, "step": 25297 }, { "epoch": 0.69, "learning_rate": 4.6068569508475545e-06, "loss": 1.3469, "step": 25298 }, { "epoch": 0.69, "learning_rate": 4.606112124408322e-06, "loss": 1.1519, "step": 25299 }, { "epoch": 0.69, "learning_rate": 4.605367340168327e-06, "loss": 1.415, "step": 25300 }, { "epoch": 0.69, "learning_rate": 4.604622598133406e-06, "loss": 1.2502, "step": 25301 }, { "epoch": 0.69, "learning_rate": 4.60387789830938e-06, "loss": 1.2803, "step": 25302 }, { "epoch": 0.69, "learning_rate": 4.603133240702077e-06, "loss": 1.228, "step": 25303 }, { "epoch": 0.69, "learning_rate": 4.602388625317317e-06, "loss": 1.2935, "step": 25304 }, { "epoch": 0.69, "learning_rate": 4.601644052160934e-06, "loss": 1.0389, "step": 25305 }, { "epoch": 0.69, "learning_rate": 4.6008995212387495e-06, "loss": 1.1194, "step": 25306 }, { "epoch": 0.69, "learning_rate": 4.6001550325565895e-06, "loss": 1.4287, "step": 25307 }, { "epoch": 0.69, "learning_rate": 4.599410586120272e-06, "loss": 1.2496, "step": 25308 }, { "epoch": 0.69, "learning_rate": 4.5986661819356315e-06, "loss": 1.1189, "step": 25309 }, { "epoch": 0.69, "learning_rate": 4.597921820008486e-06, "loss": 1.2561, "step": 25310 }, { "epoch": 0.69, "learning_rate": 4.597177500344658e-06, "loss": 1.2725, "step": 25311 }, { "epoch": 0.69, "learning_rate": 4.596433222949974e-06, "loss": 1.2124, "step": 25312 }, { "epoch": 0.69, "learning_rate": 4.595688987830252e-06, "loss": 1.0237, "step": 25313 }, { "epoch": 0.69, "learning_rate": 4.594944794991327e-06, "loss": 1.3386, "step": 25314 }, { "epoch": 0.69, "learning_rate": 4.594200644439004e-06, "loss": 1.3113, "step": 25315 }, { "epoch": 0.69, "learning_rate": 4.593456536179117e-06, "loss": 1.2908, "step": 25316 }, { "epoch": 0.69, "learning_rate": 4.592712470217481e-06, "loss": 1.3857, "step": 25317 }, { "epoch": 0.69, "learning_rate": 4.5919684465599255e-06, "loss": 1.3682, "step": 25318 }, { "epoch": 0.69, "learning_rate": 4.591224465212259e-06, "loss": 1.3201, "step": 25319 }, { "epoch": 0.69, "learning_rate": 4.590480526180313e-06, "loss": 1.1592, "step": 25320 }, { "epoch": 0.69, "learning_rate": 4.589736629469901e-06, "loss": 1.386, "step": 25321 }, { "epoch": 0.69, "learning_rate": 4.5889927750868515e-06, "loss": 1.1768, "step": 25322 }, { "epoch": 0.69, "learning_rate": 4.588248963036971e-06, "loss": 1.1272, "step": 25323 }, { "epoch": 0.69, "learning_rate": 4.587505193326089e-06, "loss": 1.3306, "step": 25324 }, { "epoch": 0.69, "learning_rate": 4.586761465960018e-06, "loss": 1.3396, "step": 25325 }, { "epoch": 0.69, "learning_rate": 4.5860177809445835e-06, "loss": 1.2495, "step": 25326 }, { "epoch": 0.69, "learning_rate": 4.5852741382856e-06, "loss": 1.3591, "step": 25327 }, { "epoch": 0.69, "learning_rate": 4.584530537988883e-06, "loss": 1.2874, "step": 25328 }, { "epoch": 0.69, "learning_rate": 4.583786980060254e-06, "loss": 1.2708, "step": 25329 }, { "epoch": 0.69, "learning_rate": 4.58304346450553e-06, "loss": 1.3093, "step": 25330 }, { "epoch": 0.69, "learning_rate": 4.5822999913305265e-06, "loss": 1.3589, "step": 25331 }, { "epoch": 0.69, "learning_rate": 4.581556560541057e-06, "loss": 1.1838, "step": 25332 }, { "epoch": 0.69, "learning_rate": 4.580813172142945e-06, "loss": 1.2678, "step": 25333 }, { "epoch": 0.69, "learning_rate": 4.580069826142002e-06, "loss": 1.3193, "step": 25334 }, { "epoch": 0.69, "learning_rate": 4.579326522544043e-06, "loss": 1.2593, "step": 25335 }, { "epoch": 0.69, "learning_rate": 4.578583261354882e-06, "loss": 1.2559, "step": 25336 }, { "epoch": 0.69, "learning_rate": 4.577840042580339e-06, "loss": 1.1801, "step": 25337 }, { "epoch": 0.69, "learning_rate": 4.577096866226227e-06, "loss": 1.1782, "step": 25338 }, { "epoch": 0.69, "learning_rate": 4.576353732298357e-06, "loss": 1.3645, "step": 25339 }, { "epoch": 0.69, "learning_rate": 4.575610640802544e-06, "loss": 1.2766, "step": 25340 }, { "epoch": 0.69, "learning_rate": 4.574867591744605e-06, "loss": 1.1787, "step": 25341 }, { "epoch": 0.69, "learning_rate": 4.5741245851303504e-06, "loss": 1.1433, "step": 25342 }, { "epoch": 0.69, "learning_rate": 4.573381620965591e-06, "loss": 1.261, "step": 25343 }, { "epoch": 0.69, "learning_rate": 4.572638699256144e-06, "loss": 1.2979, "step": 25344 }, { "epoch": 0.69, "learning_rate": 4.571895820007822e-06, "loss": 1.2219, "step": 25345 }, { "epoch": 0.69, "learning_rate": 4.571152983226434e-06, "loss": 1.2678, "step": 25346 }, { "epoch": 0.69, "learning_rate": 4.570410188917788e-06, "loss": 1.0635, "step": 25347 }, { "epoch": 0.69, "learning_rate": 4.569667437087703e-06, "loss": 1.0779, "step": 25348 }, { "epoch": 0.69, "learning_rate": 4.568924727741986e-06, "loss": 1.3506, "step": 25349 }, { "epoch": 0.69, "learning_rate": 4.568182060886449e-06, "loss": 1.2017, "step": 25350 }, { "epoch": 0.69, "learning_rate": 4.567439436526897e-06, "loss": 1.3044, "step": 25351 }, { "epoch": 0.69, "learning_rate": 4.566696854669148e-06, "loss": 1.2883, "step": 25352 }, { "epoch": 0.69, "learning_rate": 4.565954315319009e-06, "loss": 1.3633, "step": 25353 }, { "epoch": 0.69, "learning_rate": 4.565211818482287e-06, "loss": 1.6763, "step": 25354 }, { "epoch": 0.69, "learning_rate": 4.564469364164789e-06, "loss": 1.3865, "step": 25355 }, { "epoch": 0.69, "learning_rate": 4.563726952372331e-06, "loss": 1.2112, "step": 25356 }, { "epoch": 0.69, "learning_rate": 4.5629845831107155e-06, "loss": 1.3162, "step": 25357 }, { "epoch": 0.69, "learning_rate": 4.562242256385749e-06, "loss": 1.22, "step": 25358 }, { "epoch": 0.69, "learning_rate": 4.561499972203246e-06, "loss": 1.2893, "step": 25359 }, { "epoch": 0.69, "learning_rate": 4.560757730569006e-06, "loss": 1.3745, "step": 25360 }, { "epoch": 0.69, "learning_rate": 4.560015531488847e-06, "loss": 1.1987, "step": 25361 }, { "epoch": 0.69, "learning_rate": 4.559273374968562e-06, "loss": 1.3372, "step": 25362 }, { "epoch": 0.69, "learning_rate": 4.558531261013965e-06, "loss": 1.2205, "step": 25363 }, { "epoch": 0.69, "learning_rate": 4.557789189630859e-06, "loss": 1.3074, "step": 25364 }, { "epoch": 0.69, "learning_rate": 4.557047160825059e-06, "loss": 1.3147, "step": 25365 }, { "epoch": 0.69, "learning_rate": 4.556305174602353e-06, "loss": 1.0898, "step": 25366 }, { "epoch": 0.69, "learning_rate": 4.555563230968562e-06, "loss": 1.2644, "step": 25367 }, { "epoch": 0.69, "learning_rate": 4.554821329929479e-06, "loss": 1.0988, "step": 25368 }, { "epoch": 0.69, "learning_rate": 4.55407947149092e-06, "loss": 1.2312, "step": 25369 }, { "epoch": 0.69, "learning_rate": 4.5533376556586765e-06, "loss": 1.2705, "step": 25370 }, { "epoch": 0.69, "learning_rate": 4.552595882438561e-06, "loss": 1.2007, "step": 25371 }, { "epoch": 0.69, "learning_rate": 4.5518541518363694e-06, "loss": 1.3149, "step": 25372 }, { "epoch": 0.69, "learning_rate": 4.551112463857913e-06, "loss": 1.2952, "step": 25373 }, { "epoch": 0.69, "learning_rate": 4.550370818508991e-06, "loss": 1.3999, "step": 25374 }, { "epoch": 0.69, "learning_rate": 4.5496292157954014e-06, "loss": 1.2119, "step": 25375 }, { "epoch": 0.69, "learning_rate": 4.548887655722953e-06, "loss": 1.4092, "step": 25376 }, { "epoch": 0.69, "learning_rate": 4.548146138297445e-06, "loss": 1.2632, "step": 25377 }, { "epoch": 0.69, "learning_rate": 4.547404663524677e-06, "loss": 1.3809, "step": 25378 }, { "epoch": 0.69, "learning_rate": 4.546663231410449e-06, "loss": 1.1748, "step": 25379 }, { "epoch": 0.69, "learning_rate": 4.545921841960566e-06, "loss": 1.2837, "step": 25380 }, { "epoch": 0.69, "learning_rate": 4.545180495180826e-06, "loss": 1.2188, "step": 25381 }, { "epoch": 0.69, "learning_rate": 4.544439191077028e-06, "loss": 1.2952, "step": 25382 }, { "epoch": 0.69, "learning_rate": 4.54369792965497e-06, "loss": 1.3481, "step": 25383 }, { "epoch": 0.69, "learning_rate": 4.5429567109204566e-06, "loss": 1.3833, "step": 25384 }, { "epoch": 0.69, "learning_rate": 4.542215534879284e-06, "loss": 1.2268, "step": 25385 }, { "epoch": 0.69, "learning_rate": 4.54147440153725e-06, "loss": 1.6475, "step": 25386 }, { "epoch": 0.69, "learning_rate": 4.540733310900151e-06, "loss": 1.2507, "step": 25387 }, { "epoch": 0.69, "learning_rate": 4.53999226297379e-06, "loss": 1.2478, "step": 25388 }, { "epoch": 0.69, "learning_rate": 4.539251257763962e-06, "loss": 1.1868, "step": 25389 }, { "epoch": 0.69, "learning_rate": 4.538510295276462e-06, "loss": 1.1389, "step": 25390 }, { "epoch": 0.69, "learning_rate": 4.537769375517091e-06, "loss": 1.2854, "step": 25391 }, { "epoch": 0.69, "learning_rate": 4.537028498491646e-06, "loss": 1.3293, "step": 25392 }, { "epoch": 0.69, "learning_rate": 4.536287664205921e-06, "loss": 1.291, "step": 25393 }, { "epoch": 0.69, "learning_rate": 4.535546872665707e-06, "loss": 1.1528, "step": 25394 }, { "epoch": 0.69, "learning_rate": 4.534806123876809e-06, "loss": 1.2788, "step": 25395 }, { "epoch": 0.69, "learning_rate": 4.5340654178450184e-06, "loss": 1.282, "step": 25396 }, { "epoch": 0.69, "learning_rate": 4.533324754576128e-06, "loss": 1.2441, "step": 25397 }, { "epoch": 0.69, "learning_rate": 4.532584134075932e-06, "loss": 1.345, "step": 25398 }, { "epoch": 0.69, "learning_rate": 4.531843556350231e-06, "loss": 1.2095, "step": 25399 }, { "epoch": 0.69, "learning_rate": 4.5311030214048135e-06, "loss": 1.2671, "step": 25400 }, { "epoch": 0.69, "learning_rate": 4.530362529245474e-06, "loss": 1.1746, "step": 25401 }, { "epoch": 0.69, "learning_rate": 4.529622079878005e-06, "loss": 1.7563, "step": 25402 }, { "epoch": 0.69, "learning_rate": 4.5288816733082e-06, "loss": 1.3276, "step": 25403 }, { "epoch": 0.69, "learning_rate": 4.528141309541856e-06, "loss": 1.4473, "step": 25404 }, { "epoch": 0.69, "learning_rate": 4.527400988584756e-06, "loss": 1.1965, "step": 25405 }, { "epoch": 0.69, "learning_rate": 4.526660710442701e-06, "loss": 1.1851, "step": 25406 }, { "epoch": 0.69, "learning_rate": 4.525920475121475e-06, "loss": 1.2527, "step": 25407 }, { "epoch": 0.69, "learning_rate": 4.5251802826268795e-06, "loss": 1.1716, "step": 25408 }, { "epoch": 0.69, "learning_rate": 4.524440132964694e-06, "loss": 1.1677, "step": 25409 }, { "epoch": 0.69, "learning_rate": 4.523700026140716e-06, "loss": 1.4062, "step": 25410 }, { "epoch": 0.69, "learning_rate": 4.522959962160731e-06, "loss": 1.1963, "step": 25411 }, { "epoch": 0.69, "learning_rate": 4.522219941030539e-06, "loss": 1.2576, "step": 25412 }, { "epoch": 0.69, "learning_rate": 4.521479962755915e-06, "loss": 1.1566, "step": 25413 }, { "epoch": 0.69, "learning_rate": 4.520740027342658e-06, "loss": 1.2209, "step": 25414 }, { "epoch": 0.69, "learning_rate": 4.520000134796553e-06, "loss": 1.2012, "step": 25415 }, { "epoch": 0.69, "learning_rate": 4.519260285123396e-06, "loss": 1.2349, "step": 25416 }, { "epoch": 0.69, "learning_rate": 4.518520478328963e-06, "loss": 1.3491, "step": 25417 }, { "epoch": 0.69, "learning_rate": 4.51778071441905e-06, "loss": 1.1643, "step": 25418 }, { "epoch": 0.69, "learning_rate": 4.5170409933994405e-06, "loss": 1.2266, "step": 25419 }, { "epoch": 0.69, "learning_rate": 4.516301315275927e-06, "loss": 1.2122, "step": 25420 }, { "epoch": 0.69, "learning_rate": 4.515561680054294e-06, "loss": 1.2563, "step": 25421 }, { "epoch": 0.69, "learning_rate": 4.5148220877403235e-06, "loss": 1.1853, "step": 25422 }, { "epoch": 0.69, "learning_rate": 4.51408253833981e-06, "loss": 1.1938, "step": 25423 }, { "epoch": 0.69, "learning_rate": 4.513343031858534e-06, "loss": 1.2776, "step": 25424 }, { "epoch": 0.69, "learning_rate": 4.512603568302283e-06, "loss": 1.3682, "step": 25425 }, { "epoch": 0.69, "learning_rate": 4.511864147676837e-06, "loss": 1.0828, "step": 25426 }, { "epoch": 0.69, "learning_rate": 4.5111247699879905e-06, "loss": 1.333, "step": 25427 }, { "epoch": 0.69, "learning_rate": 4.510385435241521e-06, "loss": 1.2273, "step": 25428 }, { "epoch": 0.69, "learning_rate": 4.509646143443214e-06, "loss": 1.3159, "step": 25429 }, { "epoch": 0.69, "learning_rate": 4.508906894598851e-06, "loss": 1.2402, "step": 25430 }, { "epoch": 0.69, "learning_rate": 4.508167688714223e-06, "loss": 1.4561, "step": 25431 }, { "epoch": 0.69, "learning_rate": 4.5074285257951076e-06, "loss": 1.2917, "step": 25432 }, { "epoch": 0.69, "learning_rate": 4.506689405847289e-06, "loss": 1.4229, "step": 25433 }, { "epoch": 0.69, "learning_rate": 4.505950328876545e-06, "loss": 1.1428, "step": 25434 }, { "epoch": 0.69, "learning_rate": 4.5052112948886665e-06, "loss": 1.3306, "step": 25435 }, { "epoch": 0.69, "learning_rate": 4.50447230388943e-06, "loss": 1.2307, "step": 25436 }, { "epoch": 0.69, "learning_rate": 4.5037333558846155e-06, "loss": 1.417, "step": 25437 }, { "epoch": 0.69, "learning_rate": 4.5029944508800095e-06, "loss": 1.3313, "step": 25438 }, { "epoch": 0.69, "learning_rate": 4.50225558888139e-06, "loss": 1.2463, "step": 25439 }, { "epoch": 0.69, "learning_rate": 4.501516769894538e-06, "loss": 1.2024, "step": 25440 }, { "epoch": 0.69, "learning_rate": 4.5007779939252305e-06, "loss": 1.2886, "step": 25441 }, { "epoch": 0.69, "learning_rate": 4.500039260979252e-06, "loss": 1.374, "step": 25442 }, { "epoch": 0.69, "learning_rate": 4.499300571062381e-06, "loss": 1.22, "step": 25443 }, { "epoch": 0.69, "learning_rate": 4.498561924180396e-06, "loss": 1.2534, "step": 25444 }, { "epoch": 0.69, "learning_rate": 4.497823320339071e-06, "loss": 1.2478, "step": 25445 }, { "epoch": 0.69, "learning_rate": 4.497084759544193e-06, "loss": 1.1813, "step": 25446 }, { "epoch": 0.69, "learning_rate": 4.496346241801537e-06, "loss": 1.4329, "step": 25447 }, { "epoch": 0.69, "learning_rate": 4.495607767116878e-06, "loss": 1.2561, "step": 25448 }, { "epoch": 0.69, "learning_rate": 4.494869335495994e-06, "loss": 1.248, "step": 25449 }, { "epoch": 0.7, "learning_rate": 4.494130946944663e-06, "loss": 1.2544, "step": 25450 }, { "epoch": 0.7, "learning_rate": 4.493392601468669e-06, "loss": 1.3547, "step": 25451 }, { "epoch": 0.7, "learning_rate": 4.492654299073775e-06, "loss": 1.2144, "step": 25452 }, { "epoch": 0.7, "learning_rate": 4.491916039765768e-06, "loss": 1.3179, "step": 25453 }, { "epoch": 0.7, "learning_rate": 4.4911778235504156e-06, "loss": 1.3528, "step": 25454 }, { "epoch": 0.7, "learning_rate": 4.490439650433505e-06, "loss": 1.3708, "step": 25455 }, { "epoch": 0.7, "learning_rate": 4.4897015204207975e-06, "loss": 1.3315, "step": 25456 }, { "epoch": 0.7, "learning_rate": 4.488963433518076e-06, "loss": 1.259, "step": 25457 }, { "epoch": 0.7, "learning_rate": 4.4882253897311116e-06, "loss": 1.0652, "step": 25458 }, { "epoch": 0.7, "learning_rate": 4.487487389065685e-06, "loss": 1.3638, "step": 25459 }, { "epoch": 0.7, "learning_rate": 4.486749431527559e-06, "loss": 1.1204, "step": 25460 }, { "epoch": 0.7, "learning_rate": 4.486011517122516e-06, "loss": 1.4043, "step": 25461 }, { "epoch": 0.7, "learning_rate": 4.4852736458563224e-06, "loss": 1.3124, "step": 25462 }, { "epoch": 0.7, "learning_rate": 4.4845358177347585e-06, "loss": 1.2578, "step": 25463 }, { "epoch": 0.7, "learning_rate": 4.483798032763593e-06, "loss": 1.1946, "step": 25464 }, { "epoch": 0.7, "learning_rate": 4.483060290948597e-06, "loss": 1.1895, "step": 25465 }, { "epoch": 0.7, "learning_rate": 4.482322592295541e-06, "loss": 1.3516, "step": 25466 }, { "epoch": 0.7, "learning_rate": 4.4815849368102006e-06, "loss": 1.3943, "step": 25467 }, { "epoch": 0.7, "learning_rate": 4.4808473244983456e-06, "loss": 1.2688, "step": 25468 }, { "epoch": 0.7, "learning_rate": 4.480109755365742e-06, "loss": 1.2974, "step": 25469 }, { "epoch": 0.7, "learning_rate": 4.479372229418167e-06, "loss": 1.2344, "step": 25470 }, { "epoch": 0.7, "learning_rate": 4.478634746661388e-06, "loss": 1.2998, "step": 25471 }, { "epoch": 0.7, "learning_rate": 4.477897307101174e-06, "loss": 1.1604, "step": 25472 }, { "epoch": 0.7, "learning_rate": 4.477159910743293e-06, "loss": 1.3433, "step": 25473 }, { "epoch": 0.7, "learning_rate": 4.476422557593517e-06, "loss": 1.4053, "step": 25474 }, { "epoch": 0.7, "learning_rate": 4.475685247657615e-06, "loss": 1.2717, "step": 25475 }, { "epoch": 0.7, "learning_rate": 4.474947980941354e-06, "loss": 1.3379, "step": 25476 }, { "epoch": 0.7, "learning_rate": 4.474210757450498e-06, "loss": 1.1904, "step": 25477 }, { "epoch": 0.7, "learning_rate": 4.473473577190822e-06, "loss": 1.3606, "step": 25478 }, { "epoch": 0.7, "learning_rate": 4.472736440168091e-06, "loss": 1.2087, "step": 25479 }, { "epoch": 0.7, "learning_rate": 4.4719993463880695e-06, "loss": 1.2288, "step": 25480 }, { "epoch": 0.7, "learning_rate": 4.471262295856522e-06, "loss": 1.4214, "step": 25481 }, { "epoch": 0.7, "learning_rate": 4.470525288579222e-06, "loss": 1.3748, "step": 25482 }, { "epoch": 0.7, "learning_rate": 4.469788324561935e-06, "loss": 1.3662, "step": 25483 }, { "epoch": 0.7, "learning_rate": 4.4690514038104175e-06, "loss": 1.2939, "step": 25484 }, { "epoch": 0.7, "learning_rate": 4.468314526330444e-06, "loss": 1.2354, "step": 25485 }, { "epoch": 0.7, "learning_rate": 4.467577692127778e-06, "loss": 1.334, "step": 25486 }, { "epoch": 0.7, "learning_rate": 4.466840901208181e-06, "loss": 1.2041, "step": 25487 }, { "epoch": 0.7, "learning_rate": 4.466104153577418e-06, "loss": 1.2512, "step": 25488 }, { "epoch": 0.7, "learning_rate": 4.465367449241255e-06, "loss": 1.0151, "step": 25489 }, { "epoch": 0.7, "learning_rate": 4.464630788205455e-06, "loss": 1.1316, "step": 25490 }, { "epoch": 0.7, "learning_rate": 4.463894170475781e-06, "loss": 1.2209, "step": 25491 }, { "epoch": 0.7, "learning_rate": 4.463157596057993e-06, "loss": 1.3215, "step": 25492 }, { "epoch": 0.7, "learning_rate": 4.46242106495786e-06, "loss": 1.3936, "step": 25493 }, { "epoch": 0.7, "learning_rate": 4.461684577181135e-06, "loss": 1.127, "step": 25494 }, { "epoch": 0.7, "learning_rate": 4.4609481327335945e-06, "loss": 1.3496, "step": 25495 }, { "epoch": 0.7, "learning_rate": 4.460211731620984e-06, "loss": 1.4392, "step": 25496 }, { "epoch": 0.7, "learning_rate": 4.459475373849071e-06, "loss": 1.3757, "step": 25497 }, { "epoch": 0.7, "learning_rate": 4.458739059423621e-06, "loss": 1.2993, "step": 25498 }, { "epoch": 0.7, "learning_rate": 4.458002788350392e-06, "loss": 1.312, "step": 25499 }, { "epoch": 0.7, "learning_rate": 4.457266560635142e-06, "loss": 1.3079, "step": 25500 }, { "epoch": 0.7, "learning_rate": 4.456530376283629e-06, "loss": 1.2588, "step": 25501 }, { "epoch": 0.7, "learning_rate": 4.455794235301618e-06, "loss": 1.2896, "step": 25502 }, { "epoch": 0.7, "learning_rate": 4.455058137694868e-06, "loss": 1.1206, "step": 25503 }, { "epoch": 0.7, "learning_rate": 4.454322083469135e-06, "loss": 1.4001, "step": 25504 }, { "epoch": 0.7, "learning_rate": 4.453586072630174e-06, "loss": 1.3291, "step": 25505 }, { "epoch": 0.7, "learning_rate": 4.452850105183751e-06, "loss": 1.2913, "step": 25506 }, { "epoch": 0.7, "learning_rate": 4.452114181135621e-06, "loss": 1.2117, "step": 25507 }, { "epoch": 0.7, "learning_rate": 4.45137830049154e-06, "loss": 1.2097, "step": 25508 }, { "epoch": 0.7, "learning_rate": 4.450642463257263e-06, "loss": 1.3867, "step": 25509 }, { "epoch": 0.7, "learning_rate": 4.449906669438554e-06, "loss": 1.2153, "step": 25510 }, { "epoch": 0.7, "learning_rate": 4.449170919041165e-06, "loss": 1.3003, "step": 25511 }, { "epoch": 0.7, "learning_rate": 4.448435212070848e-06, "loss": 1.2856, "step": 25512 }, { "epoch": 0.7, "learning_rate": 4.447699548533368e-06, "loss": 1.1444, "step": 25513 }, { "epoch": 0.7, "learning_rate": 4.446963928434476e-06, "loss": 1.1936, "step": 25514 }, { "epoch": 0.7, "learning_rate": 4.446228351779927e-06, "loss": 1.3064, "step": 25515 }, { "epoch": 0.7, "learning_rate": 4.445492818575471e-06, "loss": 1.4001, "step": 25516 }, { "epoch": 0.7, "learning_rate": 4.444757328826872e-06, "loss": 1.2312, "step": 25517 }, { "epoch": 0.7, "learning_rate": 4.444021882539878e-06, "loss": 1.3157, "step": 25518 }, { "epoch": 0.7, "learning_rate": 4.443286479720246e-06, "loss": 1.3044, "step": 25519 }, { "epoch": 0.7, "learning_rate": 4.442551120373724e-06, "loss": 1.2251, "step": 25520 }, { "epoch": 0.7, "learning_rate": 4.441815804506071e-06, "loss": 1.2761, "step": 25521 }, { "epoch": 0.7, "learning_rate": 4.441080532123037e-06, "loss": 1.2291, "step": 25522 }, { "epoch": 0.7, "learning_rate": 4.440345303230377e-06, "loss": 1.3359, "step": 25523 }, { "epoch": 0.7, "learning_rate": 4.439610117833837e-06, "loss": 1.3545, "step": 25524 }, { "epoch": 0.7, "learning_rate": 4.438874975939176e-06, "loss": 1.2441, "step": 25525 }, { "epoch": 0.7, "learning_rate": 4.4381398775521414e-06, "loss": 1.5874, "step": 25526 }, { "epoch": 0.7, "learning_rate": 4.437404822678486e-06, "loss": 1.3345, "step": 25527 }, { "epoch": 0.7, "learning_rate": 4.436669811323955e-06, "loss": 1.2391, "step": 25528 }, { "epoch": 0.7, "learning_rate": 4.435934843494304e-06, "loss": 1.1921, "step": 25529 }, { "epoch": 0.7, "learning_rate": 4.43519991919529e-06, "loss": 1.238, "step": 25530 }, { "epoch": 0.7, "learning_rate": 4.434465038432647e-06, "loss": 1.2097, "step": 25531 }, { "epoch": 0.7, "learning_rate": 4.433730201212136e-06, "loss": 1.3069, "step": 25532 }, { "epoch": 0.7, "learning_rate": 4.4329954075394995e-06, "loss": 1.2432, "step": 25533 }, { "epoch": 0.7, "learning_rate": 4.432260657420497e-06, "loss": 1.792, "step": 25534 }, { "epoch": 0.7, "learning_rate": 4.43152595086086e-06, "loss": 1.2288, "step": 25535 }, { "epoch": 0.7, "learning_rate": 4.430791287866351e-06, "loss": 1.1001, "step": 25536 }, { "epoch": 0.7, "learning_rate": 4.430056668442707e-06, "loss": 1.4187, "step": 25537 }, { "epoch": 0.7, "learning_rate": 4.429322092595688e-06, "loss": 1.1182, "step": 25538 }, { "epoch": 0.7, "learning_rate": 4.428587560331027e-06, "loss": 1.2222, "step": 25539 }, { "epoch": 0.7, "learning_rate": 4.42785307165448e-06, "loss": 1.3398, "step": 25540 }, { "epoch": 0.7, "learning_rate": 4.427118626571786e-06, "loss": 1.2029, "step": 25541 }, { "epoch": 0.7, "learning_rate": 4.426384225088703e-06, "loss": 1.3036, "step": 25542 }, { "epoch": 0.7, "learning_rate": 4.425649867210963e-06, "loss": 1.3142, "step": 25543 }, { "epoch": 0.7, "learning_rate": 4.424915552944316e-06, "loss": 1.2817, "step": 25544 }, { "epoch": 0.7, "learning_rate": 4.424181282294512e-06, "loss": 1.3657, "step": 25545 }, { "epoch": 0.7, "learning_rate": 4.423447055267291e-06, "loss": 1.3452, "step": 25546 }, { "epoch": 0.7, "learning_rate": 4.4227128718684e-06, "loss": 1.2964, "step": 25547 }, { "epoch": 0.7, "learning_rate": 4.421978732103576e-06, "loss": 1.4038, "step": 25548 }, { "epoch": 0.7, "learning_rate": 4.42124463597857e-06, "loss": 1.1873, "step": 25549 }, { "epoch": 0.7, "learning_rate": 4.420510583499124e-06, "loss": 1.2749, "step": 25550 }, { "epoch": 0.7, "learning_rate": 4.419776574670978e-06, "loss": 1.3716, "step": 25551 }, { "epoch": 0.7, "learning_rate": 4.419042609499875e-06, "loss": 1.3521, "step": 25552 }, { "epoch": 0.7, "learning_rate": 4.41830868799156e-06, "loss": 1.2932, "step": 25553 }, { "epoch": 0.7, "learning_rate": 4.417574810151774e-06, "loss": 1.2112, "step": 25554 }, { "epoch": 0.7, "learning_rate": 4.416840975986257e-06, "loss": 1.0754, "step": 25555 }, { "epoch": 0.7, "learning_rate": 4.416107185500747e-06, "loss": 1.2268, "step": 25556 }, { "epoch": 0.7, "learning_rate": 4.415373438700994e-06, "loss": 1.1072, "step": 25557 }, { "epoch": 0.7, "learning_rate": 4.4146397355927315e-06, "loss": 1.2852, "step": 25558 }, { "epoch": 0.7, "learning_rate": 4.413906076181698e-06, "loss": 1.3584, "step": 25559 }, { "epoch": 0.7, "learning_rate": 4.4131724604736405e-06, "loss": 1.1108, "step": 25560 }, { "epoch": 0.7, "learning_rate": 4.412438888474294e-06, "loss": 1.3093, "step": 25561 }, { "epoch": 0.7, "learning_rate": 4.411705360189399e-06, "loss": 1.1873, "step": 25562 }, { "epoch": 0.7, "learning_rate": 4.410971875624689e-06, "loss": 1.3169, "step": 25563 }, { "epoch": 0.7, "learning_rate": 4.41023843478591e-06, "loss": 1.3679, "step": 25564 }, { "epoch": 0.7, "learning_rate": 4.409505037678798e-06, "loss": 1.3455, "step": 25565 }, { "epoch": 0.7, "learning_rate": 4.40877168430909e-06, "loss": 1.3699, "step": 25566 }, { "epoch": 0.7, "learning_rate": 4.408038374682519e-06, "loss": 1.2629, "step": 25567 }, { "epoch": 0.7, "learning_rate": 4.40730510880483e-06, "loss": 1.3069, "step": 25568 }, { "epoch": 0.7, "learning_rate": 4.406571886681757e-06, "loss": 1.3857, "step": 25569 }, { "epoch": 0.7, "learning_rate": 4.405838708319034e-06, "loss": 1.2937, "step": 25570 }, { "epoch": 0.7, "learning_rate": 4.405105573722395e-06, "loss": 1.1433, "step": 25571 }, { "epoch": 0.7, "learning_rate": 4.404372482897582e-06, "loss": 1.229, "step": 25572 }, { "epoch": 0.7, "learning_rate": 4.403639435850328e-06, "loss": 1.4219, "step": 25573 }, { "epoch": 0.7, "learning_rate": 4.402906432586365e-06, "loss": 1.3601, "step": 25574 }, { "epoch": 0.7, "learning_rate": 4.402173473111433e-06, "loss": 1.2163, "step": 25575 }, { "epoch": 0.7, "learning_rate": 4.401440557431259e-06, "loss": 1.1069, "step": 25576 }, { "epoch": 0.7, "learning_rate": 4.4007076855515894e-06, "loss": 1.2048, "step": 25577 }, { "epoch": 0.7, "learning_rate": 4.399974857478143e-06, "loss": 1.1006, "step": 25578 }, { "epoch": 0.7, "learning_rate": 4.399242073216663e-06, "loss": 1.3386, "step": 25579 }, { "epoch": 0.7, "learning_rate": 4.398509332772876e-06, "loss": 1.4619, "step": 25580 }, { "epoch": 0.7, "learning_rate": 4.397776636152525e-06, "loss": 1.1139, "step": 25581 }, { "epoch": 0.7, "learning_rate": 4.397043983361328e-06, "loss": 1.3982, "step": 25582 }, { "epoch": 0.7, "learning_rate": 4.396311374405028e-06, "loss": 1.1394, "step": 25583 }, { "epoch": 0.7, "learning_rate": 4.395578809289349e-06, "loss": 1.2198, "step": 25584 }, { "epoch": 0.7, "learning_rate": 4.394846288020034e-06, "loss": 1.2615, "step": 25585 }, { "epoch": 0.7, "learning_rate": 4.394113810602798e-06, "loss": 1.2346, "step": 25586 }, { "epoch": 0.7, "learning_rate": 4.393381377043383e-06, "loss": 1.2502, "step": 25587 }, { "epoch": 0.7, "learning_rate": 4.392648987347512e-06, "loss": 1.3298, "step": 25588 }, { "epoch": 0.7, "learning_rate": 4.391916641520926e-06, "loss": 1.2324, "step": 25589 }, { "epoch": 0.7, "learning_rate": 4.39118433956934e-06, "loss": 1.124, "step": 25590 }, { "epoch": 0.7, "learning_rate": 4.39045208149849e-06, "loss": 1.2659, "step": 25591 }, { "epoch": 0.7, "learning_rate": 4.389719867314109e-06, "loss": 1.1694, "step": 25592 }, { "epoch": 0.7, "learning_rate": 4.388987697021922e-06, "loss": 1.2815, "step": 25593 }, { "epoch": 0.7, "learning_rate": 4.388255570627655e-06, "loss": 1.4399, "step": 25594 }, { "epoch": 0.7, "learning_rate": 4.387523488137037e-06, "loss": 1.2192, "step": 25595 }, { "epoch": 0.7, "learning_rate": 4.3867914495557975e-06, "loss": 1.2173, "step": 25596 }, { "epoch": 0.7, "learning_rate": 4.3860594548896615e-06, "loss": 1.3264, "step": 25597 }, { "epoch": 0.7, "learning_rate": 4.385327504144357e-06, "loss": 1.3169, "step": 25598 }, { "epoch": 0.7, "learning_rate": 4.384595597325608e-06, "loss": 1.2173, "step": 25599 }, { "epoch": 0.7, "learning_rate": 4.3838637344391455e-06, "loss": 1.2769, "step": 25600 }, { "epoch": 0.7, "learning_rate": 4.3831319154906915e-06, "loss": 1.1921, "step": 25601 }, { "epoch": 0.7, "learning_rate": 4.3824001404859714e-06, "loss": 1.2068, "step": 25602 }, { "epoch": 0.7, "learning_rate": 4.3816684094307095e-06, "loss": 1.1669, "step": 25603 }, { "epoch": 0.7, "learning_rate": 4.380936722330634e-06, "loss": 1.3481, "step": 25604 }, { "epoch": 0.7, "learning_rate": 4.380205079191467e-06, "loss": 1.3096, "step": 25605 }, { "epoch": 0.7, "learning_rate": 4.379473480018931e-06, "loss": 1.3528, "step": 25606 }, { "epoch": 0.7, "learning_rate": 4.378741924818755e-06, "loss": 1.3721, "step": 25607 }, { "epoch": 0.7, "learning_rate": 4.3780104135966574e-06, "loss": 1.2419, "step": 25608 }, { "epoch": 0.7, "learning_rate": 4.377278946358363e-06, "loss": 1.4436, "step": 25609 }, { "epoch": 0.7, "learning_rate": 4.376547523109591e-06, "loss": 1.2292, "step": 25610 }, { "epoch": 0.7, "learning_rate": 4.375816143856071e-06, "loss": 1.4009, "step": 25611 }, { "epoch": 0.7, "learning_rate": 4.37508480860352e-06, "loss": 1.2693, "step": 25612 }, { "epoch": 0.7, "learning_rate": 4.37435351735766e-06, "loss": 1.3113, "step": 25613 }, { "epoch": 0.7, "learning_rate": 4.37362227012421e-06, "loss": 1.1479, "step": 25614 }, { "epoch": 0.7, "learning_rate": 4.372891066908897e-06, "loss": 1.2583, "step": 25615 }, { "epoch": 0.7, "learning_rate": 4.372159907717438e-06, "loss": 1.2224, "step": 25616 }, { "epoch": 0.7, "learning_rate": 4.371428792555554e-06, "loss": 1.282, "step": 25617 }, { "epoch": 0.7, "learning_rate": 4.37069772142896e-06, "loss": 1.0911, "step": 25618 }, { "epoch": 0.7, "learning_rate": 4.369966694343385e-06, "loss": 1.2463, "step": 25619 }, { "epoch": 0.7, "learning_rate": 4.3692357113045415e-06, "loss": 1.1624, "step": 25620 }, { "epoch": 0.7, "learning_rate": 4.368504772318147e-06, "loss": 1.3157, "step": 25621 }, { "epoch": 0.7, "learning_rate": 4.367773877389927e-06, "loss": 1.2935, "step": 25622 }, { "epoch": 0.7, "learning_rate": 4.3670430265255914e-06, "loss": 1.252, "step": 25623 }, { "epoch": 0.7, "learning_rate": 4.36631221973087e-06, "loss": 1.3413, "step": 25624 }, { "epoch": 0.7, "learning_rate": 4.3655814570114664e-06, "loss": 1.1077, "step": 25625 }, { "epoch": 0.7, "learning_rate": 4.364850738373106e-06, "loss": 1.3823, "step": 25626 }, { "epoch": 0.7, "learning_rate": 4.364120063821501e-06, "loss": 1.2378, "step": 25627 }, { "epoch": 0.7, "learning_rate": 4.363389433362377e-06, "loss": 1.4175, "step": 25628 }, { "epoch": 0.7, "learning_rate": 4.3626588470014375e-06, "loss": 1.3228, "step": 25629 }, { "epoch": 0.7, "learning_rate": 4.361928304744407e-06, "loss": 1.4175, "step": 25630 }, { "epoch": 0.7, "learning_rate": 4.361197806596994e-06, "loss": 1.1792, "step": 25631 }, { "epoch": 0.7, "learning_rate": 4.360467352564926e-06, "loss": 1.2554, "step": 25632 }, { "epoch": 0.7, "learning_rate": 4.359736942653903e-06, "loss": 1.2969, "step": 25633 }, { "epoch": 0.7, "learning_rate": 4.359006576869647e-06, "loss": 1.6641, "step": 25634 }, { "epoch": 0.7, "learning_rate": 4.358276255217869e-06, "loss": 1.3374, "step": 25635 }, { "epoch": 0.7, "learning_rate": 4.35754597770429e-06, "loss": 1.23, "step": 25636 }, { "epoch": 0.7, "learning_rate": 4.356815744334615e-06, "loss": 1.281, "step": 25637 }, { "epoch": 0.7, "learning_rate": 4.356085555114558e-06, "loss": 1.2522, "step": 25638 }, { "epoch": 0.7, "learning_rate": 4.3553554100498365e-06, "loss": 1.4307, "step": 25639 }, { "epoch": 0.7, "learning_rate": 4.35462530914616e-06, "loss": 1.4844, "step": 25640 }, { "epoch": 0.7, "learning_rate": 4.3538952524092415e-06, "loss": 1.2744, "step": 25641 }, { "epoch": 0.7, "learning_rate": 4.3531652398447865e-06, "loss": 1.3362, "step": 25642 }, { "epoch": 0.7, "learning_rate": 4.3524352714585165e-06, "loss": 1.283, "step": 25643 }, { "epoch": 0.7, "learning_rate": 4.351705347256136e-06, "loss": 1.4053, "step": 25644 }, { "epoch": 0.7, "learning_rate": 4.350975467243358e-06, "loss": 1.2732, "step": 25645 }, { "epoch": 0.7, "learning_rate": 4.350245631425887e-06, "loss": 1.1978, "step": 25646 }, { "epoch": 0.7, "learning_rate": 4.349515839809441e-06, "loss": 1.21, "step": 25647 }, { "epoch": 0.7, "learning_rate": 4.348786092399726e-06, "loss": 1.3501, "step": 25648 }, { "epoch": 0.7, "learning_rate": 4.348056389202452e-06, "loss": 1.3562, "step": 25649 }, { "epoch": 0.7, "learning_rate": 4.347326730223324e-06, "loss": 1.3259, "step": 25650 }, { "epoch": 0.7, "learning_rate": 4.346597115468055e-06, "loss": 1.0575, "step": 25651 }, { "epoch": 0.7, "learning_rate": 4.345867544942354e-06, "loss": 1.303, "step": 25652 }, { "epoch": 0.7, "learning_rate": 4.345138018651921e-06, "loss": 1.2361, "step": 25653 }, { "epoch": 0.7, "learning_rate": 4.344408536602473e-06, "loss": 1.7954, "step": 25654 }, { "epoch": 0.7, "learning_rate": 4.343679098799715e-06, "loss": 1.2954, "step": 25655 }, { "epoch": 0.7, "learning_rate": 4.342949705249351e-06, "loss": 1.314, "step": 25656 }, { "epoch": 0.7, "learning_rate": 4.3422203559570845e-06, "loss": 1.2283, "step": 25657 }, { "epoch": 0.7, "learning_rate": 4.341491050928629e-06, "loss": 1.1494, "step": 25658 }, { "epoch": 0.7, "learning_rate": 4.340761790169687e-06, "loss": 1.1199, "step": 25659 }, { "epoch": 0.7, "learning_rate": 4.340032573685963e-06, "loss": 1.3257, "step": 25660 }, { "epoch": 0.7, "learning_rate": 4.3393034014831595e-06, "loss": 1.3108, "step": 25661 }, { "epoch": 0.7, "learning_rate": 4.338574273566988e-06, "loss": 1.2805, "step": 25662 }, { "epoch": 0.7, "learning_rate": 4.337845189943148e-06, "loss": 1.1462, "step": 25663 }, { "epoch": 0.7, "learning_rate": 4.337116150617346e-06, "loss": 1.415, "step": 25664 }, { "epoch": 0.7, "learning_rate": 4.336387155595281e-06, "loss": 1.2668, "step": 25665 }, { "epoch": 0.7, "learning_rate": 4.335658204882662e-06, "loss": 1.2236, "step": 25666 }, { "epoch": 0.7, "learning_rate": 4.334929298485191e-06, "loss": 1.2649, "step": 25667 }, { "epoch": 0.7, "learning_rate": 4.334200436408566e-06, "loss": 1.3562, "step": 25668 }, { "epoch": 0.7, "learning_rate": 4.333471618658495e-06, "loss": 1.1729, "step": 25669 }, { "epoch": 0.7, "learning_rate": 4.332742845240674e-06, "loss": 1.0505, "step": 25670 }, { "epoch": 0.7, "learning_rate": 4.332014116160815e-06, "loss": 1.3149, "step": 25671 }, { "epoch": 0.7, "learning_rate": 4.3312854314246055e-06, "loss": 1.2031, "step": 25672 }, { "epoch": 0.7, "learning_rate": 4.330556791037757e-06, "loss": 1.3364, "step": 25673 }, { "epoch": 0.7, "learning_rate": 4.329828195005962e-06, "loss": 1.4104, "step": 25674 }, { "epoch": 0.7, "learning_rate": 4.329099643334932e-06, "loss": 1.7051, "step": 25675 }, { "epoch": 0.7, "learning_rate": 4.328371136030353e-06, "loss": 1.3469, "step": 25676 }, { "epoch": 0.7, "learning_rate": 4.327642673097935e-06, "loss": 1.3669, "step": 25677 }, { "epoch": 0.7, "learning_rate": 4.326914254543369e-06, "loss": 1.2451, "step": 25678 }, { "epoch": 0.7, "learning_rate": 4.3261858803723665e-06, "loss": 1.1924, "step": 25679 }, { "epoch": 0.7, "learning_rate": 4.3254575505906105e-06, "loss": 1.3633, "step": 25680 }, { "epoch": 0.7, "learning_rate": 4.324729265203809e-06, "loss": 1.2524, "step": 25681 }, { "epoch": 0.7, "learning_rate": 4.3240010242176535e-06, "loss": 1.3096, "step": 25682 }, { "epoch": 0.7, "learning_rate": 4.323272827637849e-06, "loss": 1.0645, "step": 25683 }, { "epoch": 0.7, "learning_rate": 4.322544675470088e-06, "loss": 1.1692, "step": 25684 }, { "epoch": 0.7, "learning_rate": 4.321816567720064e-06, "loss": 1.1909, "step": 25685 }, { "epoch": 0.7, "learning_rate": 4.321088504393481e-06, "loss": 1.1865, "step": 25686 }, { "epoch": 0.7, "learning_rate": 4.3203604854960325e-06, "loss": 1.3606, "step": 25687 }, { "epoch": 0.7, "learning_rate": 4.319632511033411e-06, "loss": 1.2588, "step": 25688 }, { "epoch": 0.7, "learning_rate": 4.31890458101131e-06, "loss": 1.3264, "step": 25689 }, { "epoch": 0.7, "learning_rate": 4.318176695435433e-06, "loss": 1.2644, "step": 25690 }, { "epoch": 0.7, "learning_rate": 4.317448854311469e-06, "loss": 1.0991, "step": 25691 }, { "epoch": 0.7, "learning_rate": 4.316721057645113e-06, "loss": 1.2122, "step": 25692 }, { "epoch": 0.7, "learning_rate": 4.315993305442056e-06, "loss": 1.2183, "step": 25693 }, { "epoch": 0.7, "learning_rate": 4.315265597707997e-06, "loss": 1.2656, "step": 25694 }, { "epoch": 0.7, "learning_rate": 4.314537934448628e-06, "loss": 1.1741, "step": 25695 }, { "epoch": 0.7, "learning_rate": 4.31381031566964e-06, "loss": 1.3455, "step": 25696 }, { "epoch": 0.7, "learning_rate": 4.313082741376723e-06, "loss": 1.2422, "step": 25697 }, { "epoch": 0.7, "learning_rate": 4.312355211575575e-06, "loss": 1.4192, "step": 25698 }, { "epoch": 0.7, "learning_rate": 4.311627726271886e-06, "loss": 1.3186, "step": 25699 }, { "epoch": 0.7, "learning_rate": 4.310900285471345e-06, "loss": 1.3264, "step": 25700 }, { "epoch": 0.7, "learning_rate": 4.3101728891796464e-06, "loss": 1.2026, "step": 25701 }, { "epoch": 0.7, "learning_rate": 4.3094455374024805e-06, "loss": 1.272, "step": 25702 }, { "epoch": 0.7, "learning_rate": 4.3087182301455366e-06, "loss": 1.3496, "step": 25703 }, { "epoch": 0.7, "learning_rate": 4.307990967414501e-06, "loss": 1.3384, "step": 25704 }, { "epoch": 0.7, "learning_rate": 4.307263749215072e-06, "loss": 1.2981, "step": 25705 }, { "epoch": 0.7, "learning_rate": 4.306536575552933e-06, "loss": 1.2625, "step": 25706 }, { "epoch": 0.7, "learning_rate": 4.305809446433775e-06, "loss": 1.1191, "step": 25707 }, { "epoch": 0.7, "learning_rate": 4.3050823618632845e-06, "loss": 1.1985, "step": 25708 }, { "epoch": 0.7, "learning_rate": 4.304355321847153e-06, "loss": 1.2725, "step": 25709 }, { "epoch": 0.7, "learning_rate": 4.3036283263910686e-06, "loss": 1.3247, "step": 25710 }, { "epoch": 0.7, "learning_rate": 4.302901375500716e-06, "loss": 1.3423, "step": 25711 }, { "epoch": 0.7, "learning_rate": 4.302174469181782e-06, "loss": 1.3098, "step": 25712 }, { "epoch": 0.7, "learning_rate": 4.3014476074399595e-06, "loss": 1.1943, "step": 25713 }, { "epoch": 0.7, "learning_rate": 4.30072079028093e-06, "loss": 1.4082, "step": 25714 }, { "epoch": 0.7, "learning_rate": 4.299994017710378e-06, "loss": 1.1594, "step": 25715 }, { "epoch": 0.7, "learning_rate": 4.299267289733997e-06, "loss": 1.1953, "step": 25716 }, { "epoch": 0.7, "learning_rate": 4.298540606357463e-06, "loss": 1.2251, "step": 25717 }, { "epoch": 0.7, "learning_rate": 4.297813967586474e-06, "loss": 1.3027, "step": 25718 }, { "epoch": 0.7, "learning_rate": 4.2970873734267e-06, "loss": 1.3274, "step": 25719 }, { "epoch": 0.7, "learning_rate": 4.2963608238838365e-06, "loss": 1.2754, "step": 25720 }, { "epoch": 0.7, "learning_rate": 4.2956343189635595e-06, "loss": 1.2468, "step": 25721 }, { "epoch": 0.7, "learning_rate": 4.2949078586715655e-06, "loss": 1.3279, "step": 25722 }, { "epoch": 0.7, "learning_rate": 4.294181443013522e-06, "loss": 1.3413, "step": 25723 }, { "epoch": 0.7, "learning_rate": 4.293455071995123e-06, "loss": 1.1997, "step": 25724 }, { "epoch": 0.7, "learning_rate": 4.292728745622046e-06, "loss": 1.2737, "step": 25725 }, { "epoch": 0.7, "learning_rate": 4.292002463899977e-06, "loss": 1.304, "step": 25726 }, { "epoch": 0.7, "learning_rate": 4.2912762268345975e-06, "loss": 1.2363, "step": 25727 }, { "epoch": 0.7, "learning_rate": 4.2905500344315886e-06, "loss": 1.2754, "step": 25728 }, { "epoch": 0.7, "learning_rate": 4.289823886696628e-06, "loss": 1.1821, "step": 25729 }, { "epoch": 0.7, "learning_rate": 4.2890977836354046e-06, "loss": 1.4053, "step": 25730 }, { "epoch": 0.7, "learning_rate": 4.2883717252535925e-06, "loss": 1.1846, "step": 25731 }, { "epoch": 0.7, "learning_rate": 4.287645711556872e-06, "loss": 1.2986, "step": 25732 }, { "epoch": 0.7, "learning_rate": 4.286919742550929e-06, "loss": 1.2107, "step": 25733 }, { "epoch": 0.7, "learning_rate": 4.28619381824144e-06, "loss": 1.2764, "step": 25734 }, { "epoch": 0.7, "learning_rate": 4.285467938634082e-06, "loss": 1.0745, "step": 25735 }, { "epoch": 0.7, "learning_rate": 4.284742103734534e-06, "loss": 1.145, "step": 25736 }, { "epoch": 0.7, "learning_rate": 4.284016313548478e-06, "loss": 1.3298, "step": 25737 }, { "epoch": 0.7, "learning_rate": 4.283290568081592e-06, "loss": 1.2126, "step": 25738 }, { "epoch": 0.7, "learning_rate": 4.282564867339552e-06, "loss": 1.3984, "step": 25739 }, { "epoch": 0.7, "learning_rate": 4.281839211328032e-06, "loss": 1.1924, "step": 25740 }, { "epoch": 0.7, "learning_rate": 4.2811136000527165e-06, "loss": 1.1687, "step": 25741 }, { "epoch": 0.7, "learning_rate": 4.280388033519279e-06, "loss": 1.1736, "step": 25742 }, { "epoch": 0.7, "learning_rate": 4.279662511733397e-06, "loss": 1.1821, "step": 25743 }, { "epoch": 0.7, "learning_rate": 4.278937034700741e-06, "loss": 1.2549, "step": 25744 }, { "epoch": 0.7, "learning_rate": 4.2782116024269956e-06, "loss": 1.4094, "step": 25745 }, { "epoch": 0.7, "learning_rate": 4.277486214917832e-06, "loss": 1.3989, "step": 25746 }, { "epoch": 0.7, "learning_rate": 4.276760872178921e-06, "loss": 1.2041, "step": 25747 }, { "epoch": 0.7, "learning_rate": 4.276035574215947e-06, "loss": 1.1721, "step": 25748 }, { "epoch": 0.7, "learning_rate": 4.275310321034577e-06, "loss": 1.3022, "step": 25749 }, { "epoch": 0.7, "learning_rate": 4.274585112640488e-06, "loss": 1.1931, "step": 25750 }, { "epoch": 0.7, "learning_rate": 4.27385994903935e-06, "loss": 1.093, "step": 25751 }, { "epoch": 0.7, "learning_rate": 4.2731348302368416e-06, "loss": 1.1782, "step": 25752 }, { "epoch": 0.7, "learning_rate": 4.272409756238634e-06, "loss": 1.2637, "step": 25753 }, { "epoch": 0.7, "learning_rate": 4.271684727050399e-06, "loss": 1.2747, "step": 25754 }, { "epoch": 0.7, "learning_rate": 4.270959742677805e-06, "loss": 1.3325, "step": 25755 }, { "epoch": 0.7, "learning_rate": 4.270234803126532e-06, "loss": 1.2192, "step": 25756 }, { "epoch": 0.7, "learning_rate": 4.269509908402244e-06, "loss": 1.3171, "step": 25757 }, { "epoch": 0.7, "learning_rate": 4.268785058510623e-06, "loss": 1.1742, "step": 25758 }, { "epoch": 0.7, "learning_rate": 4.268060253457325e-06, "loss": 1.2827, "step": 25759 }, { "epoch": 0.7, "learning_rate": 4.2673354932480296e-06, "loss": 1.2283, "step": 25760 }, { "epoch": 0.7, "learning_rate": 4.266610777888407e-06, "loss": 1.4124, "step": 25761 }, { "epoch": 0.7, "learning_rate": 4.2658861073841275e-06, "loss": 1.2402, "step": 25762 }, { "epoch": 0.7, "learning_rate": 4.265161481740858e-06, "loss": 1.3608, "step": 25763 }, { "epoch": 0.7, "learning_rate": 4.264436900964265e-06, "loss": 1.2803, "step": 25764 }, { "epoch": 0.7, "learning_rate": 4.263712365060024e-06, "loss": 1.1501, "step": 25765 }, { "epoch": 0.7, "learning_rate": 4.2629878740338e-06, "loss": 1.3162, "step": 25766 }, { "epoch": 0.7, "learning_rate": 4.262263427891261e-06, "loss": 1.3257, "step": 25767 }, { "epoch": 0.7, "learning_rate": 4.261539026638072e-06, "loss": 1.1294, "step": 25768 }, { "epoch": 0.7, "learning_rate": 4.260814670279907e-06, "loss": 1.1194, "step": 25769 }, { "epoch": 0.7, "learning_rate": 4.260090358822428e-06, "loss": 1.271, "step": 25770 }, { "epoch": 0.7, "learning_rate": 4.259366092271304e-06, "loss": 1.2429, "step": 25771 }, { "epoch": 0.7, "learning_rate": 4.258641870632196e-06, "loss": 1.3181, "step": 25772 }, { "epoch": 0.7, "learning_rate": 4.257917693910778e-06, "loss": 1.2622, "step": 25773 }, { "epoch": 0.7, "learning_rate": 4.257193562112713e-06, "loss": 1.1833, "step": 25774 }, { "epoch": 0.7, "learning_rate": 4.256469475243663e-06, "loss": 1.2822, "step": 25775 }, { "epoch": 0.7, "learning_rate": 4.255745433309293e-06, "loss": 1.4126, "step": 25776 }, { "epoch": 0.7, "learning_rate": 4.255021436315272e-06, "loss": 1.2253, "step": 25777 }, { "epoch": 0.7, "learning_rate": 4.2542974842672625e-06, "loss": 1.2102, "step": 25778 }, { "epoch": 0.7, "learning_rate": 4.253573577170924e-06, "loss": 1.3545, "step": 25779 }, { "epoch": 0.7, "learning_rate": 4.252849715031928e-06, "loss": 1.2095, "step": 25780 }, { "epoch": 0.7, "learning_rate": 4.2521258978559324e-06, "loss": 1.1013, "step": 25781 }, { "epoch": 0.7, "learning_rate": 4.2514021256486016e-06, "loss": 1.0991, "step": 25782 }, { "epoch": 0.7, "learning_rate": 4.250678398415593e-06, "loss": 1.1819, "step": 25783 }, { "epoch": 0.7, "learning_rate": 4.249954716162577e-06, "loss": 1.1055, "step": 25784 }, { "epoch": 0.7, "learning_rate": 4.2492310788952115e-06, "loss": 1.2327, "step": 25785 }, { "epoch": 0.7, "learning_rate": 4.248507486619158e-06, "loss": 1.3223, "step": 25786 }, { "epoch": 0.7, "learning_rate": 4.247783939340073e-06, "loss": 1.1006, "step": 25787 }, { "epoch": 0.7, "learning_rate": 4.247060437063626e-06, "loss": 1.2927, "step": 25788 }, { "epoch": 0.7, "learning_rate": 4.246336979795473e-06, "loss": 1.2844, "step": 25789 }, { "epoch": 0.7, "learning_rate": 4.245613567541274e-06, "loss": 1.2571, "step": 25790 }, { "epoch": 0.7, "learning_rate": 4.244890200306684e-06, "loss": 1.3267, "step": 25791 }, { "epoch": 0.7, "learning_rate": 4.244166878097368e-06, "loss": 1.2961, "step": 25792 }, { "epoch": 0.7, "learning_rate": 4.243443600918991e-06, "loss": 1.1738, "step": 25793 }, { "epoch": 0.7, "learning_rate": 4.242720368777195e-06, "loss": 1.3462, "step": 25794 }, { "epoch": 0.7, "learning_rate": 4.241997181677654e-06, "loss": 1.3879, "step": 25795 }, { "epoch": 0.7, "learning_rate": 4.241274039626014e-06, "loss": 1.2463, "step": 25796 }, { "epoch": 0.7, "learning_rate": 4.240550942627946e-06, "loss": 1.1138, "step": 25797 }, { "epoch": 0.7, "learning_rate": 4.239827890689091e-06, "loss": 1.0876, "step": 25798 }, { "epoch": 0.7, "learning_rate": 4.239104883815118e-06, "loss": 1.2024, "step": 25799 }, { "epoch": 0.7, "learning_rate": 4.2383819220116766e-06, "loss": 1.1787, "step": 25800 }, { "epoch": 0.7, "learning_rate": 4.237659005284432e-06, "loss": 1.3857, "step": 25801 }, { "epoch": 0.7, "learning_rate": 4.236936133639027e-06, "loss": 1.3206, "step": 25802 }, { "epoch": 0.7, "learning_rate": 4.236213307081127e-06, "loss": 1.3049, "step": 25803 }, { "epoch": 0.7, "learning_rate": 4.2354905256163806e-06, "loss": 1.1953, "step": 25804 }, { "epoch": 0.7, "learning_rate": 4.234767789250452e-06, "loss": 1.1582, "step": 25805 }, { "epoch": 0.7, "learning_rate": 4.234045097988984e-06, "loss": 1.2915, "step": 25806 }, { "epoch": 0.7, "learning_rate": 4.2333224518376334e-06, "loss": 1.2356, "step": 25807 }, { "epoch": 0.7, "learning_rate": 4.2325998508020614e-06, "loss": 1.4431, "step": 25808 }, { "epoch": 0.7, "learning_rate": 4.231877294887915e-06, "loss": 1.1406, "step": 25809 }, { "epoch": 0.7, "learning_rate": 4.231154784100849e-06, "loss": 1.3364, "step": 25810 }, { "epoch": 0.7, "learning_rate": 4.2304323184465125e-06, "loss": 1.1484, "step": 25811 }, { "epoch": 0.7, "learning_rate": 4.229709897930563e-06, "loss": 1.2896, "step": 25812 }, { "epoch": 0.7, "learning_rate": 4.2289875225586495e-06, "loss": 1.1355, "step": 25813 }, { "epoch": 0.7, "learning_rate": 4.228265192336425e-06, "loss": 1.3657, "step": 25814 }, { "epoch": 0.7, "learning_rate": 4.227542907269535e-06, "loss": 1.3867, "step": 25815 }, { "epoch": 0.71, "learning_rate": 4.226820667363639e-06, "loss": 1.2593, "step": 25816 }, { "epoch": 0.71, "learning_rate": 4.226098472624384e-06, "loss": 1.2559, "step": 25817 }, { "epoch": 0.71, "learning_rate": 4.225376323057419e-06, "loss": 1.2529, "step": 25818 }, { "epoch": 0.71, "learning_rate": 4.22465421866839e-06, "loss": 1.1938, "step": 25819 }, { "epoch": 0.71, "learning_rate": 4.223932159462955e-06, "loss": 1.2893, "step": 25820 }, { "epoch": 0.71, "learning_rate": 4.223210145446758e-06, "loss": 1.2224, "step": 25821 }, { "epoch": 0.71, "learning_rate": 4.2224881766254475e-06, "loss": 1.075, "step": 25822 }, { "epoch": 0.71, "learning_rate": 4.221766253004671e-06, "loss": 1.387, "step": 25823 }, { "epoch": 0.71, "learning_rate": 4.2210443745900806e-06, "loss": 1.2869, "step": 25824 }, { "epoch": 0.71, "learning_rate": 4.220322541387323e-06, "loss": 1.281, "step": 25825 }, { "epoch": 0.71, "learning_rate": 4.219600753402039e-06, "loss": 1.2046, "step": 25826 }, { "epoch": 0.71, "learning_rate": 4.2188790106398845e-06, "loss": 1.2183, "step": 25827 }, { "epoch": 0.71, "learning_rate": 4.218157313106503e-06, "loss": 1.1035, "step": 25828 }, { "epoch": 0.71, "learning_rate": 4.217435660807538e-06, "loss": 1.3069, "step": 25829 }, { "epoch": 0.71, "learning_rate": 4.216714053748636e-06, "loss": 1.1899, "step": 25830 }, { "epoch": 0.71, "learning_rate": 4.215992491935445e-06, "loss": 1.3201, "step": 25831 }, { "epoch": 0.71, "learning_rate": 4.215270975373611e-06, "loss": 1.2468, "step": 25832 }, { "epoch": 0.71, "learning_rate": 4.214549504068776e-06, "loss": 1.2336, "step": 25833 }, { "epoch": 0.71, "learning_rate": 4.213828078026581e-06, "loss": 1.3928, "step": 25834 }, { "epoch": 0.71, "learning_rate": 4.213106697252679e-06, "loss": 1.3281, "step": 25835 }, { "epoch": 0.71, "learning_rate": 4.212385361752708e-06, "loss": 1.2097, "step": 25836 }, { "epoch": 0.71, "learning_rate": 4.211664071532313e-06, "loss": 1.3008, "step": 25837 }, { "epoch": 0.71, "learning_rate": 4.210942826597132e-06, "loss": 1.1824, "step": 25838 }, { "epoch": 0.71, "learning_rate": 4.210221626952813e-06, "loss": 1.2693, "step": 25839 }, { "epoch": 0.71, "learning_rate": 4.2095004726050036e-06, "loss": 1.1465, "step": 25840 }, { "epoch": 0.71, "learning_rate": 4.208779363559333e-06, "loss": 1.22, "step": 25841 }, { "epoch": 0.71, "learning_rate": 4.2080582998214534e-06, "loss": 1.4124, "step": 25842 }, { "epoch": 0.71, "learning_rate": 4.207337281396998e-06, "loss": 1.125, "step": 25843 }, { "epoch": 0.71, "learning_rate": 4.20661630829162e-06, "loss": 1.1855, "step": 25844 }, { "epoch": 0.71, "learning_rate": 4.205895380510943e-06, "loss": 1.1416, "step": 25845 }, { "epoch": 0.71, "learning_rate": 4.205174498060621e-06, "loss": 1.292, "step": 25846 }, { "epoch": 0.71, "learning_rate": 4.204453660946285e-06, "loss": 1.2703, "step": 25847 }, { "epoch": 0.71, "learning_rate": 4.203732869173585e-06, "loss": 1.3804, "step": 25848 }, { "epoch": 0.71, "learning_rate": 4.203012122748146e-06, "loss": 1.1553, "step": 25849 }, { "epoch": 0.71, "learning_rate": 4.2022914216756186e-06, "loss": 1.3513, "step": 25850 }, { "epoch": 0.71, "learning_rate": 4.2015707659616326e-06, "loss": 1.3152, "step": 25851 }, { "epoch": 0.71, "learning_rate": 4.200850155611838e-06, "loss": 1.3428, "step": 25852 }, { "epoch": 0.71, "learning_rate": 4.2001295906318576e-06, "loss": 1.22, "step": 25853 }, { "epoch": 0.71, "learning_rate": 4.199409071027335e-06, "loss": 1.0701, "step": 25854 }, { "epoch": 0.71, "learning_rate": 4.198688596803913e-06, "loss": 1.2024, "step": 25855 }, { "epoch": 0.71, "learning_rate": 4.197968167967222e-06, "loss": 1.4124, "step": 25856 }, { "epoch": 0.71, "learning_rate": 4.197247784522901e-06, "loss": 1.3511, "step": 25857 }, { "epoch": 0.71, "learning_rate": 4.196527446476582e-06, "loss": 1.3137, "step": 25858 }, { "epoch": 0.71, "learning_rate": 4.195807153833905e-06, "loss": 1.2788, "step": 25859 }, { "epoch": 0.71, "learning_rate": 4.195086906600504e-06, "loss": 1.186, "step": 25860 }, { "epoch": 0.71, "learning_rate": 4.194366704782013e-06, "loss": 1.345, "step": 25861 }, { "epoch": 0.71, "learning_rate": 4.193646548384064e-06, "loss": 1.2021, "step": 25862 }, { "epoch": 0.71, "learning_rate": 4.192926437412298e-06, "loss": 1.3384, "step": 25863 }, { "epoch": 0.71, "learning_rate": 4.192206371872344e-06, "loss": 1.3469, "step": 25864 }, { "epoch": 0.71, "learning_rate": 4.191486351769837e-06, "loss": 1.1617, "step": 25865 }, { "epoch": 0.71, "learning_rate": 4.190766377110406e-06, "loss": 1.2058, "step": 25866 }, { "epoch": 0.71, "learning_rate": 4.19004644789969e-06, "loss": 1.3242, "step": 25867 }, { "epoch": 0.71, "learning_rate": 4.189326564143319e-06, "loss": 1.3013, "step": 25868 }, { "epoch": 0.71, "learning_rate": 4.188606725846921e-06, "loss": 1.0645, "step": 25869 }, { "epoch": 0.71, "learning_rate": 4.187886933016134e-06, "loss": 1.209, "step": 25870 }, { "epoch": 0.71, "learning_rate": 4.187167185656588e-06, "loss": 1.3428, "step": 25871 }, { "epoch": 0.71, "learning_rate": 4.186447483773912e-06, "loss": 1.2937, "step": 25872 }, { "epoch": 0.71, "learning_rate": 4.185727827373734e-06, "loss": 1.3602, "step": 25873 }, { "epoch": 0.71, "learning_rate": 4.1850082164616905e-06, "loss": 1.0874, "step": 25874 }, { "epoch": 0.71, "learning_rate": 4.184288651043407e-06, "loss": 1.2, "step": 25875 }, { "epoch": 0.71, "learning_rate": 4.183569131124516e-06, "loss": 1.0163, "step": 25876 }, { "epoch": 0.71, "learning_rate": 4.182849656710642e-06, "loss": 1.2089, "step": 25877 }, { "epoch": 0.71, "learning_rate": 4.182130227807418e-06, "loss": 1.2957, "step": 25878 }, { "epoch": 0.71, "learning_rate": 4.181410844420473e-06, "loss": 1.2561, "step": 25879 }, { "epoch": 0.71, "learning_rate": 4.180691506555434e-06, "loss": 1.1448, "step": 25880 }, { "epoch": 0.71, "learning_rate": 4.179972214217925e-06, "loss": 1.3364, "step": 25881 }, { "epoch": 0.71, "learning_rate": 4.179252967413578e-06, "loss": 1.1727, "step": 25882 }, { "epoch": 0.71, "learning_rate": 4.17853376614802e-06, "loss": 1.28, "step": 25883 }, { "epoch": 0.71, "learning_rate": 4.177814610426877e-06, "loss": 1.1138, "step": 25884 }, { "epoch": 0.71, "learning_rate": 4.17709550025577e-06, "loss": 1.1588, "step": 25885 }, { "epoch": 0.71, "learning_rate": 4.17637643564033e-06, "loss": 1.3809, "step": 25886 }, { "epoch": 0.71, "learning_rate": 4.175657416586189e-06, "loss": 1.2866, "step": 25887 }, { "epoch": 0.71, "learning_rate": 4.174938443098959e-06, "loss": 1.2781, "step": 25888 }, { "epoch": 0.71, "learning_rate": 4.174219515184276e-06, "loss": 1.25, "step": 25889 }, { "epoch": 0.71, "learning_rate": 4.173500632847754e-06, "loss": 1.3579, "step": 25890 }, { "epoch": 0.71, "learning_rate": 4.1727817960950326e-06, "loss": 1.3408, "step": 25891 }, { "epoch": 0.71, "learning_rate": 4.172063004931718e-06, "loss": 1.2566, "step": 25892 }, { "epoch": 0.71, "learning_rate": 4.171344259363446e-06, "loss": 1.2952, "step": 25893 }, { "epoch": 0.71, "learning_rate": 4.1706255593958325e-06, "loss": 1.3906, "step": 25894 }, { "epoch": 0.71, "learning_rate": 4.1699069050345094e-06, "loss": 1.3083, "step": 25895 }, { "epoch": 0.71, "learning_rate": 4.169188296285087e-06, "loss": 1.3086, "step": 25896 }, { "epoch": 0.71, "learning_rate": 4.168469733153198e-06, "loss": 1.2993, "step": 25897 }, { "epoch": 0.71, "learning_rate": 4.167751215644455e-06, "loss": 1.3242, "step": 25898 }, { "epoch": 0.71, "learning_rate": 4.1670327437644895e-06, "loss": 1.2122, "step": 25899 }, { "epoch": 0.71, "learning_rate": 4.166314317518911e-06, "loss": 1.2676, "step": 25900 }, { "epoch": 0.71, "learning_rate": 4.165595936913347e-06, "loss": 1.3188, "step": 25901 }, { "epoch": 0.71, "learning_rate": 4.1648776019534195e-06, "loss": 1.1938, "step": 25902 }, { "epoch": 0.71, "learning_rate": 4.164159312644747e-06, "loss": 1.2988, "step": 25903 }, { "epoch": 0.71, "learning_rate": 4.163441068992947e-06, "loss": 1.3047, "step": 25904 }, { "epoch": 0.71, "learning_rate": 4.162722871003636e-06, "loss": 1.0056, "step": 25905 }, { "epoch": 0.71, "learning_rate": 4.16200471868244e-06, "loss": 1.2808, "step": 25906 }, { "epoch": 0.71, "learning_rate": 4.1612866120349736e-06, "loss": 1.2275, "step": 25907 }, { "epoch": 0.71, "learning_rate": 4.160568551066855e-06, "loss": 1.1318, "step": 25908 }, { "epoch": 0.71, "learning_rate": 4.159850535783699e-06, "loss": 1.2441, "step": 25909 }, { "epoch": 0.71, "learning_rate": 4.15913256619113e-06, "loss": 1.2776, "step": 25910 }, { "epoch": 0.71, "learning_rate": 4.15841464229476e-06, "loss": 1.21, "step": 25911 }, { "epoch": 0.71, "learning_rate": 4.157696764100209e-06, "loss": 1.6533, "step": 25912 }, { "epoch": 0.71, "learning_rate": 4.156978931613086e-06, "loss": 1.2976, "step": 25913 }, { "epoch": 0.71, "learning_rate": 4.156261144839017e-06, "loss": 1.2739, "step": 25914 }, { "epoch": 0.71, "learning_rate": 4.155543403783612e-06, "loss": 1.2566, "step": 25915 }, { "epoch": 0.71, "learning_rate": 4.154825708452483e-06, "loss": 1.2188, "step": 25916 }, { "epoch": 0.71, "learning_rate": 4.154108058851254e-06, "loss": 1.3005, "step": 25917 }, { "epoch": 0.71, "learning_rate": 4.153390454985534e-06, "loss": 1.6577, "step": 25918 }, { "epoch": 0.71, "learning_rate": 4.152672896860938e-06, "loss": 1.3105, "step": 25919 }, { "epoch": 0.71, "learning_rate": 4.151955384483077e-06, "loss": 1.3745, "step": 25920 }, { "epoch": 0.71, "learning_rate": 4.151237917857569e-06, "loss": 1.2488, "step": 25921 }, { "epoch": 0.71, "learning_rate": 4.150520496990026e-06, "loss": 1.2778, "step": 25922 }, { "epoch": 0.71, "learning_rate": 4.149803121886059e-06, "loss": 1.2998, "step": 25923 }, { "epoch": 0.71, "learning_rate": 4.1490857925512795e-06, "loss": 1.1553, "step": 25924 }, { "epoch": 0.71, "learning_rate": 4.148368508991304e-06, "loss": 1.1664, "step": 25925 }, { "epoch": 0.71, "learning_rate": 4.147651271211742e-06, "loss": 1.3235, "step": 25926 }, { "epoch": 0.71, "learning_rate": 4.146934079218205e-06, "loss": 1.3169, "step": 25927 }, { "epoch": 0.71, "learning_rate": 4.146216933016299e-06, "loss": 1.3416, "step": 25928 }, { "epoch": 0.71, "learning_rate": 4.145499832611642e-06, "loss": 1.0527, "step": 25929 }, { "epoch": 0.71, "learning_rate": 4.144782778009843e-06, "loss": 1.3328, "step": 25930 }, { "epoch": 0.71, "learning_rate": 4.144065769216506e-06, "loss": 1.2244, "step": 25931 }, { "epoch": 0.71, "learning_rate": 4.143348806237249e-06, "loss": 1.2429, "step": 25932 }, { "epoch": 0.71, "learning_rate": 4.142631889077672e-06, "loss": 1.2068, "step": 25933 }, { "epoch": 0.71, "learning_rate": 4.141915017743397e-06, "loss": 1.0691, "step": 25934 }, { "epoch": 0.71, "learning_rate": 4.141198192240017e-06, "loss": 1.2625, "step": 25935 }, { "epoch": 0.71, "learning_rate": 4.140481412573149e-06, "loss": 1.2795, "step": 25936 }, { "epoch": 0.71, "learning_rate": 4.139764678748398e-06, "loss": 1.7131, "step": 25937 }, { "epoch": 0.71, "learning_rate": 4.139047990771379e-06, "loss": 1.2285, "step": 25938 }, { "epoch": 0.71, "learning_rate": 4.138331348647685e-06, "loss": 1.27, "step": 25939 }, { "epoch": 0.71, "learning_rate": 4.1376147523829336e-06, "loss": 1.2937, "step": 25940 }, { "epoch": 0.71, "learning_rate": 4.136898201982725e-06, "loss": 1.1448, "step": 25941 }, { "epoch": 0.71, "learning_rate": 4.136181697452675e-06, "loss": 1.2534, "step": 25942 }, { "epoch": 0.71, "learning_rate": 4.1354652387983725e-06, "loss": 1.0883, "step": 25943 }, { "epoch": 0.71, "learning_rate": 4.134748826025438e-06, "loss": 1.0698, "step": 25944 }, { "epoch": 0.71, "learning_rate": 4.134032459139467e-06, "loss": 1.2195, "step": 25945 }, { "epoch": 0.71, "learning_rate": 4.133316138146075e-06, "loss": 1.4014, "step": 25946 }, { "epoch": 0.71, "learning_rate": 4.132599863050851e-06, "loss": 1.2725, "step": 25947 }, { "epoch": 0.71, "learning_rate": 4.131883633859407e-06, "loss": 1.4292, "step": 25948 }, { "epoch": 0.71, "learning_rate": 4.131167450577349e-06, "loss": 1.2822, "step": 25949 }, { "epoch": 0.71, "learning_rate": 4.130451313210277e-06, "loss": 1.3171, "step": 25950 }, { "epoch": 0.71, "learning_rate": 4.129735221763795e-06, "loss": 1.1333, "step": 25951 }, { "epoch": 0.71, "learning_rate": 4.129019176243501e-06, "loss": 1.1382, "step": 25952 }, { "epoch": 0.71, "learning_rate": 4.128303176655002e-06, "loss": 1.2654, "step": 25953 }, { "epoch": 0.71, "learning_rate": 4.1275872230039e-06, "loss": 1.0253, "step": 25954 }, { "epoch": 0.71, "learning_rate": 4.126871315295792e-06, "loss": 1.3645, "step": 25955 }, { "epoch": 0.71, "learning_rate": 4.126155453536279e-06, "loss": 1.104, "step": 25956 }, { "epoch": 0.71, "learning_rate": 4.125439637730967e-06, "loss": 1.2314, "step": 25957 }, { "epoch": 0.71, "learning_rate": 4.124723867885452e-06, "loss": 1.1965, "step": 25958 }, { "epoch": 0.71, "learning_rate": 4.124008144005335e-06, "loss": 1.2039, "step": 25959 }, { "epoch": 0.71, "learning_rate": 4.123292466096212e-06, "loss": 1.3037, "step": 25960 }, { "epoch": 0.71, "learning_rate": 4.122576834163689e-06, "loss": 1.1829, "step": 25961 }, { "epoch": 0.71, "learning_rate": 4.121861248213361e-06, "loss": 1.0858, "step": 25962 }, { "epoch": 0.71, "learning_rate": 4.121145708250823e-06, "loss": 1.3145, "step": 25963 }, { "epoch": 0.71, "learning_rate": 4.12043021428168e-06, "loss": 1.2522, "step": 25964 }, { "epoch": 0.71, "learning_rate": 4.119714766311525e-06, "loss": 1.2156, "step": 25965 }, { "epoch": 0.71, "learning_rate": 4.118999364345959e-06, "loss": 1.6724, "step": 25966 }, { "epoch": 0.71, "learning_rate": 4.118284008390572e-06, "loss": 1.2788, "step": 25967 }, { "epoch": 0.71, "learning_rate": 4.117568698450968e-06, "loss": 1.2908, "step": 25968 }, { "epoch": 0.71, "learning_rate": 4.11685343453274e-06, "loss": 1.1069, "step": 25969 }, { "epoch": 0.71, "learning_rate": 4.116138216641485e-06, "loss": 1.3633, "step": 25970 }, { "epoch": 0.71, "learning_rate": 4.1154230447827946e-06, "loss": 1.1367, "step": 25971 }, { "epoch": 0.71, "learning_rate": 4.114707918962271e-06, "loss": 1.3347, "step": 25972 }, { "epoch": 0.71, "learning_rate": 4.113992839185504e-06, "loss": 1.2373, "step": 25973 }, { "epoch": 0.71, "learning_rate": 4.113277805458091e-06, "loss": 1.1901, "step": 25974 }, { "epoch": 0.71, "learning_rate": 4.112562817785619e-06, "loss": 1.385, "step": 25975 }, { "epoch": 0.71, "learning_rate": 4.1118478761736915e-06, "loss": 1.3215, "step": 25976 }, { "epoch": 0.71, "learning_rate": 4.111132980627896e-06, "loss": 1.1961, "step": 25977 }, { "epoch": 0.71, "learning_rate": 4.110418131153826e-06, "loss": 1.3521, "step": 25978 }, { "epoch": 0.71, "learning_rate": 4.109703327757076e-06, "loss": 1.2439, "step": 25979 }, { "epoch": 0.71, "learning_rate": 4.108988570443235e-06, "loss": 1.1226, "step": 25980 }, { "epoch": 0.71, "learning_rate": 4.108273859217905e-06, "loss": 1.2078, "step": 25981 }, { "epoch": 0.71, "learning_rate": 4.107559194086662e-06, "loss": 1.3289, "step": 25982 }, { "epoch": 0.71, "learning_rate": 4.106844575055109e-06, "loss": 1.1086, "step": 25983 }, { "epoch": 0.71, "learning_rate": 4.106130002128828e-06, "loss": 1.293, "step": 25984 }, { "epoch": 0.71, "learning_rate": 4.105415475313423e-06, "loss": 1.0955, "step": 25985 }, { "epoch": 0.71, "learning_rate": 4.104700994614468e-06, "loss": 1.3367, "step": 25986 }, { "epoch": 0.71, "learning_rate": 4.103986560037564e-06, "loss": 1.1919, "step": 25987 }, { "epoch": 0.71, "learning_rate": 4.1032721715882925e-06, "loss": 1.2954, "step": 25988 }, { "epoch": 0.71, "learning_rate": 4.1025578292722505e-06, "loss": 1.3525, "step": 25989 }, { "epoch": 0.71, "learning_rate": 4.101843533095022e-06, "loss": 1.3223, "step": 25990 }, { "epoch": 0.71, "learning_rate": 4.1011292830621985e-06, "loss": 1.3335, "step": 25991 }, { "epoch": 0.71, "learning_rate": 4.100415079179361e-06, "loss": 1.2415, "step": 25992 }, { "epoch": 0.71, "learning_rate": 4.099700921452104e-06, "loss": 1.3682, "step": 25993 }, { "epoch": 0.71, "learning_rate": 4.098986809886013e-06, "loss": 1.1963, "step": 25994 }, { "epoch": 0.71, "learning_rate": 4.098272744486672e-06, "loss": 1.2371, "step": 25995 }, { "epoch": 0.71, "learning_rate": 4.097558725259673e-06, "loss": 1.3391, "step": 25996 }, { "epoch": 0.71, "learning_rate": 4.096844752210598e-06, "loss": 1.2148, "step": 25997 }, { "epoch": 0.71, "learning_rate": 4.096130825345035e-06, "loss": 1.2861, "step": 25998 }, { "epoch": 0.71, "learning_rate": 4.095416944668563e-06, "loss": 1.2942, "step": 25999 }, { "epoch": 0.71, "learning_rate": 4.094703110186777e-06, "loss": 1.2598, "step": 26000 }, { "epoch": 0.71, "learning_rate": 4.093989321905257e-06, "loss": 1.3486, "step": 26001 }, { "epoch": 0.71, "learning_rate": 4.093275579829587e-06, "loss": 1.2537, "step": 26002 }, { "epoch": 0.71, "learning_rate": 4.092561883965349e-06, "loss": 1.2307, "step": 26003 }, { "epoch": 0.71, "learning_rate": 4.091848234318132e-06, "loss": 1.3418, "step": 26004 }, { "epoch": 0.71, "learning_rate": 4.091134630893515e-06, "loss": 1.3462, "step": 26005 }, { "epoch": 0.71, "learning_rate": 4.090421073697083e-06, "loss": 1.2842, "step": 26006 }, { "epoch": 0.71, "learning_rate": 4.089707562734414e-06, "loss": 1.3813, "step": 26007 }, { "epoch": 0.71, "learning_rate": 4.0889940980110975e-06, "loss": 1.2053, "step": 26008 }, { "epoch": 0.71, "learning_rate": 4.088280679532711e-06, "loss": 1.3606, "step": 26009 }, { "epoch": 0.71, "learning_rate": 4.087567307304834e-06, "loss": 1.4028, "step": 26010 }, { "epoch": 0.71, "learning_rate": 4.086853981333053e-06, "loss": 1.2874, "step": 26011 }, { "epoch": 0.71, "learning_rate": 4.086140701622947e-06, "loss": 1.1204, "step": 26012 }, { "epoch": 0.71, "learning_rate": 4.0854274681800944e-06, "loss": 1.3162, "step": 26013 }, { "epoch": 0.71, "learning_rate": 4.084714281010072e-06, "loss": 1.2197, "step": 26014 }, { "epoch": 0.71, "learning_rate": 4.084001140118467e-06, "loss": 1.3242, "step": 26015 }, { "epoch": 0.71, "learning_rate": 4.083288045510856e-06, "loss": 1.323, "step": 26016 }, { "epoch": 0.71, "learning_rate": 4.082574997192817e-06, "loss": 1.2617, "step": 26017 }, { "epoch": 0.71, "learning_rate": 4.081861995169924e-06, "loss": 1.1768, "step": 26018 }, { "epoch": 0.71, "learning_rate": 4.081149039447765e-06, "loss": 1.6035, "step": 26019 }, { "epoch": 0.71, "learning_rate": 4.080436130031913e-06, "loss": 1.2583, "step": 26020 }, { "epoch": 0.71, "learning_rate": 4.079723266927944e-06, "loss": 1.4551, "step": 26021 }, { "epoch": 0.71, "learning_rate": 4.0790104501414315e-06, "loss": 1.3184, "step": 26022 }, { "epoch": 0.71, "learning_rate": 4.078297679677963e-06, "loss": 1.2073, "step": 26023 }, { "epoch": 0.71, "learning_rate": 4.0775849555431034e-06, "loss": 1.157, "step": 26024 }, { "epoch": 0.71, "learning_rate": 4.07687227774244e-06, "loss": 1.0535, "step": 26025 }, { "epoch": 0.71, "learning_rate": 4.07615964628154e-06, "loss": 1.3232, "step": 26026 }, { "epoch": 0.71, "learning_rate": 4.075447061165979e-06, "loss": 1.1028, "step": 26027 }, { "epoch": 0.71, "learning_rate": 4.0747345224013376e-06, "loss": 1.2808, "step": 26028 }, { "epoch": 0.71, "learning_rate": 4.074022029993187e-06, "loss": 1.1992, "step": 26029 }, { "epoch": 0.71, "learning_rate": 4.0733095839471024e-06, "loss": 1.1326, "step": 26030 }, { "epoch": 0.71, "learning_rate": 4.072597184268653e-06, "loss": 1.3372, "step": 26031 }, { "epoch": 0.71, "learning_rate": 4.071884830963419e-06, "loss": 1.248, "step": 26032 }, { "epoch": 0.71, "learning_rate": 4.07117252403697e-06, "loss": 1.2173, "step": 26033 }, { "epoch": 0.71, "learning_rate": 4.07046026349488e-06, "loss": 1.0991, "step": 26034 }, { "epoch": 0.71, "learning_rate": 4.069748049342717e-06, "loss": 1.3948, "step": 26035 }, { "epoch": 0.71, "learning_rate": 4.06903588158606e-06, "loss": 1.162, "step": 26036 }, { "epoch": 0.71, "learning_rate": 4.068323760230477e-06, "loss": 1.2444, "step": 26037 }, { "epoch": 0.71, "learning_rate": 4.067611685281539e-06, "loss": 1.2324, "step": 26038 }, { "epoch": 0.71, "learning_rate": 4.066899656744816e-06, "loss": 1.7642, "step": 26039 }, { "epoch": 0.71, "learning_rate": 4.066187674625882e-06, "loss": 1.1914, "step": 26040 }, { "epoch": 0.71, "learning_rate": 4.065475738930307e-06, "loss": 1.1655, "step": 26041 }, { "epoch": 0.71, "learning_rate": 4.064763849663655e-06, "loss": 1.2292, "step": 26042 }, { "epoch": 0.71, "learning_rate": 4.064052006831501e-06, "loss": 1.3623, "step": 26043 }, { "epoch": 0.71, "learning_rate": 4.063340210439416e-06, "loss": 1.4248, "step": 26044 }, { "epoch": 0.71, "learning_rate": 4.062628460492964e-06, "loss": 1.2864, "step": 26045 }, { "epoch": 0.71, "learning_rate": 4.061916756997711e-06, "loss": 1.219, "step": 26046 }, { "epoch": 0.71, "learning_rate": 4.0612050999592345e-06, "loss": 1.1855, "step": 26047 }, { "epoch": 0.71, "learning_rate": 4.060493489383095e-06, "loss": 1.2815, "step": 26048 }, { "epoch": 0.71, "learning_rate": 4.059781925274861e-06, "loss": 1.21, "step": 26049 }, { "epoch": 0.71, "learning_rate": 4.059070407640099e-06, "loss": 1.1748, "step": 26050 }, { "epoch": 0.71, "learning_rate": 4.0583589364843776e-06, "loss": 1.3318, "step": 26051 }, { "epoch": 0.71, "learning_rate": 4.057647511813263e-06, "loss": 1.1978, "step": 26052 }, { "epoch": 0.71, "learning_rate": 4.05693613363232e-06, "loss": 1.3779, "step": 26053 }, { "epoch": 0.71, "learning_rate": 4.05622480194711e-06, "loss": 1.1826, "step": 26054 }, { "epoch": 0.71, "learning_rate": 4.055513516763202e-06, "loss": 1.748, "step": 26055 }, { "epoch": 0.71, "learning_rate": 4.054802278086168e-06, "loss": 1.3347, "step": 26056 }, { "epoch": 0.71, "learning_rate": 4.05409108592156e-06, "loss": 1.252, "step": 26057 }, { "epoch": 0.71, "learning_rate": 4.053379940274948e-06, "loss": 1.188, "step": 26058 }, { "epoch": 0.71, "learning_rate": 4.052668841151894e-06, "loss": 1.3647, "step": 26059 }, { "epoch": 0.71, "learning_rate": 4.051957788557969e-06, "loss": 1.196, "step": 26060 }, { "epoch": 0.71, "learning_rate": 4.051246782498721e-06, "loss": 1.2974, "step": 26061 }, { "epoch": 0.71, "learning_rate": 4.050535822979725e-06, "loss": 1.3101, "step": 26062 }, { "epoch": 0.71, "learning_rate": 4.049824910006537e-06, "loss": 1.3103, "step": 26063 }, { "epoch": 0.71, "learning_rate": 4.0491140435847265e-06, "loss": 1.4363, "step": 26064 }, { "epoch": 0.71, "learning_rate": 4.048403223719842e-06, "loss": 1.1455, "step": 26065 }, { "epoch": 0.71, "learning_rate": 4.0476924504174565e-06, "loss": 1.3103, "step": 26066 }, { "epoch": 0.71, "learning_rate": 4.046981723683122e-06, "loss": 1.3682, "step": 26067 }, { "epoch": 0.71, "learning_rate": 4.046271043522412e-06, "loss": 1.3118, "step": 26068 }, { "epoch": 0.71, "learning_rate": 4.045560409940869e-06, "loss": 1.6768, "step": 26069 }, { "epoch": 0.71, "learning_rate": 4.044849822944064e-06, "loss": 1.3755, "step": 26070 }, { "epoch": 0.71, "learning_rate": 4.0441392825375525e-06, "loss": 1.2944, "step": 26071 }, { "epoch": 0.71, "learning_rate": 4.043428788726897e-06, "loss": 1.3984, "step": 26072 }, { "epoch": 0.71, "learning_rate": 4.042718341517654e-06, "loss": 1.3105, "step": 26073 }, { "epoch": 0.71, "learning_rate": 4.0420079409153775e-06, "loss": 1.2439, "step": 26074 }, { "epoch": 0.71, "learning_rate": 4.0412975869256335e-06, "loss": 1.3882, "step": 26075 }, { "epoch": 0.71, "learning_rate": 4.040587279553974e-06, "loss": 1.6816, "step": 26076 }, { "epoch": 0.71, "learning_rate": 4.039877018805958e-06, "loss": 1.3015, "step": 26077 }, { "epoch": 0.71, "learning_rate": 4.039166804687138e-06, "loss": 1.2433, "step": 26078 }, { "epoch": 0.71, "learning_rate": 4.038456637203077e-06, "loss": 1.1545, "step": 26079 }, { "epoch": 0.71, "learning_rate": 4.037746516359328e-06, "loss": 1.3657, "step": 26080 }, { "epoch": 0.71, "learning_rate": 4.037036442161447e-06, "loss": 1.1575, "step": 26081 }, { "epoch": 0.71, "learning_rate": 4.036326414614985e-06, "loss": 1.178, "step": 26082 }, { "epoch": 0.71, "learning_rate": 4.0356164337255055e-06, "loss": 1.2583, "step": 26083 }, { "epoch": 0.71, "learning_rate": 4.034906499498558e-06, "loss": 1.317, "step": 26084 }, { "epoch": 0.71, "learning_rate": 4.034196611939696e-06, "loss": 1.3103, "step": 26085 }, { "epoch": 0.71, "learning_rate": 4.033486771054471e-06, "loss": 1.3062, "step": 26086 }, { "epoch": 0.71, "learning_rate": 4.032776976848443e-06, "loss": 1.2141, "step": 26087 }, { "epoch": 0.71, "learning_rate": 4.0320672293271634e-06, "loss": 1.3657, "step": 26088 }, { "epoch": 0.71, "learning_rate": 4.031357528496179e-06, "loss": 1.2175, "step": 26089 }, { "epoch": 0.71, "learning_rate": 4.030647874361051e-06, "loss": 1.3477, "step": 26090 }, { "epoch": 0.71, "learning_rate": 4.0299382669273264e-06, "loss": 1.3535, "step": 26091 }, { "epoch": 0.71, "learning_rate": 4.029228706200557e-06, "loss": 1.1174, "step": 26092 }, { "epoch": 0.71, "learning_rate": 4.028519192186292e-06, "loss": 1.6226, "step": 26093 }, { "epoch": 0.71, "learning_rate": 4.027809724890088e-06, "loss": 1.3179, "step": 26094 }, { "epoch": 0.71, "learning_rate": 4.027100304317493e-06, "loss": 1.2615, "step": 26095 }, { "epoch": 0.71, "learning_rate": 4.0263909304740556e-06, "loss": 1.2637, "step": 26096 }, { "epoch": 0.71, "learning_rate": 4.025681603365323e-06, "loss": 1.3115, "step": 26097 }, { "epoch": 0.71, "learning_rate": 4.0249723229968525e-06, "loss": 1.2759, "step": 26098 }, { "epoch": 0.71, "learning_rate": 4.024263089374189e-06, "loss": 1.2632, "step": 26099 }, { "epoch": 0.71, "learning_rate": 4.02355390250288e-06, "loss": 1.1519, "step": 26100 }, { "epoch": 0.71, "learning_rate": 4.022844762388472e-06, "loss": 1.2891, "step": 26101 }, { "epoch": 0.71, "learning_rate": 4.022135669036516e-06, "loss": 1.2861, "step": 26102 }, { "epoch": 0.71, "learning_rate": 4.021426622452567e-06, "loss": 1.2, "step": 26103 }, { "epoch": 0.71, "learning_rate": 4.020717622642158e-06, "loss": 1.313, "step": 26104 }, { "epoch": 0.71, "learning_rate": 4.020008669610845e-06, "loss": 1.3267, "step": 26105 }, { "epoch": 0.71, "learning_rate": 4.01929976336417e-06, "loss": 1.2759, "step": 26106 }, { "epoch": 0.71, "learning_rate": 4.018590903907686e-06, "loss": 1.6401, "step": 26107 }, { "epoch": 0.71, "learning_rate": 4.017882091246929e-06, "loss": 1.3162, "step": 26108 }, { "epoch": 0.71, "learning_rate": 4.017173325387452e-06, "loss": 1.218, "step": 26109 }, { "epoch": 0.71, "learning_rate": 4.016464606334796e-06, "loss": 1.3096, "step": 26110 }, { "epoch": 0.71, "learning_rate": 4.015755934094513e-06, "loss": 1.3303, "step": 26111 }, { "epoch": 0.71, "learning_rate": 4.015047308672134e-06, "loss": 1.2944, "step": 26112 }, { "epoch": 0.71, "learning_rate": 4.014338730073215e-06, "loss": 1.2639, "step": 26113 }, { "epoch": 0.71, "learning_rate": 4.013630198303291e-06, "loss": 1.1572, "step": 26114 }, { "epoch": 0.71, "learning_rate": 4.012921713367917e-06, "loss": 1.3643, "step": 26115 }, { "epoch": 0.71, "learning_rate": 4.01221327527262e-06, "loss": 1.4062, "step": 26116 }, { "epoch": 0.71, "learning_rate": 4.011504884022952e-06, "loss": 1.448, "step": 26117 }, { "epoch": 0.71, "learning_rate": 4.0107965396244564e-06, "loss": 1.2424, "step": 26118 }, { "epoch": 0.71, "learning_rate": 4.010088242082672e-06, "loss": 1.2996, "step": 26119 }, { "epoch": 0.71, "learning_rate": 4.009379991403142e-06, "loss": 1.2837, "step": 26120 }, { "epoch": 0.71, "learning_rate": 4.0086717875914015e-06, "loss": 1.2544, "step": 26121 }, { "epoch": 0.71, "learning_rate": 4.007963630652999e-06, "loss": 1.2437, "step": 26122 }, { "epoch": 0.71, "learning_rate": 4.007255520593471e-06, "loss": 1.325, "step": 26123 }, { "epoch": 0.71, "learning_rate": 4.006547457418359e-06, "loss": 1.2239, "step": 26124 }, { "epoch": 0.71, "learning_rate": 4.005839441133198e-06, "loss": 1.2876, "step": 26125 }, { "epoch": 0.71, "learning_rate": 4.005131471743533e-06, "loss": 1.3794, "step": 26126 }, { "epoch": 0.71, "learning_rate": 4.004423549254901e-06, "loss": 1.311, "step": 26127 }, { "epoch": 0.71, "learning_rate": 4.00371567367284e-06, "loss": 1.3723, "step": 26128 }, { "epoch": 0.71, "learning_rate": 4.003007845002884e-06, "loss": 1.3816, "step": 26129 }, { "epoch": 0.71, "learning_rate": 4.002300063250578e-06, "loss": 1.2671, "step": 26130 }, { "epoch": 0.71, "learning_rate": 4.0015923284214566e-06, "loss": 1.1919, "step": 26131 }, { "epoch": 0.71, "learning_rate": 4.000884640521055e-06, "loss": 1.3313, "step": 26132 }, { "epoch": 0.71, "learning_rate": 4.000176999554909e-06, "loss": 1.2749, "step": 26133 }, { "epoch": 0.71, "learning_rate": 3.999469405528559e-06, "loss": 1.2412, "step": 26134 }, { "epoch": 0.71, "learning_rate": 3.998761858447539e-06, "loss": 1.201, "step": 26135 }, { "epoch": 0.71, "learning_rate": 3.998054358317381e-06, "loss": 1.0757, "step": 26136 }, { "epoch": 0.71, "learning_rate": 3.997346905143627e-06, "loss": 1.3179, "step": 26137 }, { "epoch": 0.71, "learning_rate": 3.996639498931809e-06, "loss": 1.3357, "step": 26138 }, { "epoch": 0.71, "learning_rate": 3.9959321396874595e-06, "loss": 1.2761, "step": 26139 }, { "epoch": 0.71, "learning_rate": 3.99522482741611e-06, "loss": 1.2837, "step": 26140 }, { "epoch": 0.71, "learning_rate": 3.994517562123302e-06, "loss": 1.146, "step": 26141 }, { "epoch": 0.71, "learning_rate": 3.993810343814563e-06, "loss": 1.1533, "step": 26142 }, { "epoch": 0.71, "learning_rate": 3.99310317249543e-06, "loss": 1.2258, "step": 26143 }, { "epoch": 0.71, "learning_rate": 3.992396048171429e-06, "loss": 1.3054, "step": 26144 }, { "epoch": 0.71, "learning_rate": 3.991688970848099e-06, "loss": 1.3367, "step": 26145 }, { "epoch": 0.71, "learning_rate": 3.990981940530969e-06, "loss": 1.4102, "step": 26146 }, { "epoch": 0.71, "learning_rate": 3.990274957225572e-06, "loss": 1.2136, "step": 26147 }, { "epoch": 0.71, "learning_rate": 3.989568020937433e-06, "loss": 1.2148, "step": 26148 }, { "epoch": 0.71, "learning_rate": 3.988861131672087e-06, "loss": 1.2395, "step": 26149 }, { "epoch": 0.71, "learning_rate": 3.988154289435073e-06, "loss": 1.1609, "step": 26150 }, { "epoch": 0.71, "learning_rate": 3.9874474942319065e-06, "loss": 1.3718, "step": 26151 }, { "epoch": 0.71, "learning_rate": 3.986740746068125e-06, "loss": 1.0935, "step": 26152 }, { "epoch": 0.71, "learning_rate": 3.9860340449492544e-06, "loss": 1.2654, "step": 26153 }, { "epoch": 0.71, "learning_rate": 3.985327390880832e-06, "loss": 1.0901, "step": 26154 }, { "epoch": 0.71, "learning_rate": 3.984620783868373e-06, "loss": 1.4324, "step": 26155 }, { "epoch": 0.71, "learning_rate": 3.983914223917415e-06, "loss": 1.2549, "step": 26156 }, { "epoch": 0.71, "learning_rate": 3.983207711033481e-06, "loss": 1.2383, "step": 26157 }, { "epoch": 0.71, "learning_rate": 3.982501245222107e-06, "loss": 1.2766, "step": 26158 }, { "epoch": 0.71, "learning_rate": 3.981794826488806e-06, "loss": 1.2583, "step": 26159 }, { "epoch": 0.71, "learning_rate": 3.981088454839116e-06, "loss": 1.3018, "step": 26160 }, { "epoch": 0.71, "learning_rate": 3.980382130278557e-06, "loss": 1.1169, "step": 26161 }, { "epoch": 0.71, "learning_rate": 3.979675852812665e-06, "loss": 1.2632, "step": 26162 }, { "epoch": 0.71, "learning_rate": 3.9789696224469484e-06, "loss": 1.186, "step": 26163 }, { "epoch": 0.71, "learning_rate": 3.978263439186945e-06, "loss": 1.2563, "step": 26164 }, { "epoch": 0.71, "learning_rate": 3.977557303038179e-06, "loss": 1.2529, "step": 26165 }, { "epoch": 0.71, "learning_rate": 3.9768512140061734e-06, "loss": 1.5093, "step": 26166 }, { "epoch": 0.71, "learning_rate": 3.976145172096451e-06, "loss": 1.3257, "step": 26167 }, { "epoch": 0.71, "learning_rate": 3.975439177314533e-06, "loss": 1.2534, "step": 26168 }, { "epoch": 0.71, "learning_rate": 3.974733229665949e-06, "loss": 1.2915, "step": 26169 }, { "epoch": 0.71, "learning_rate": 3.974027329156219e-06, "loss": 1.3162, "step": 26170 }, { "epoch": 0.71, "learning_rate": 3.973321475790867e-06, "loss": 1.322, "step": 26171 }, { "epoch": 0.71, "learning_rate": 3.972615669575408e-06, "loss": 1.0445, "step": 26172 }, { "epoch": 0.71, "learning_rate": 3.9719099105153744e-06, "loss": 1.3157, "step": 26173 }, { "epoch": 0.71, "learning_rate": 3.971204198616284e-06, "loss": 1.2068, "step": 26174 }, { "epoch": 0.71, "learning_rate": 3.970498533883655e-06, "loss": 1.2063, "step": 26175 }, { "epoch": 0.71, "learning_rate": 3.969792916323009e-06, "loss": 1.2422, "step": 26176 }, { "epoch": 0.71, "learning_rate": 3.9690873459398694e-06, "loss": 1.1187, "step": 26177 }, { "epoch": 0.71, "learning_rate": 3.968381822739755e-06, "loss": 1.2058, "step": 26178 }, { "epoch": 0.71, "learning_rate": 3.967676346728181e-06, "loss": 1.3674, "step": 26179 }, { "epoch": 0.71, "learning_rate": 3.966970917910675e-06, "loss": 1.0933, "step": 26180 }, { "epoch": 0.71, "learning_rate": 3.966265536292751e-06, "loss": 1.3323, "step": 26181 }, { "epoch": 0.72, "learning_rate": 3.965560201879929e-06, "loss": 1.6753, "step": 26182 }, { "epoch": 0.72, "learning_rate": 3.964854914677722e-06, "loss": 1.4116, "step": 26183 }, { "epoch": 0.72, "learning_rate": 3.964149674691655e-06, "loss": 1.0288, "step": 26184 }, { "epoch": 0.72, "learning_rate": 3.963444481927244e-06, "loss": 1.5391, "step": 26185 }, { "epoch": 0.72, "learning_rate": 3.962739336390005e-06, "loss": 1.2032, "step": 26186 }, { "epoch": 0.72, "learning_rate": 3.962034238085451e-06, "loss": 1.2773, "step": 26187 }, { "epoch": 0.72, "learning_rate": 3.961329187019104e-06, "loss": 1.2473, "step": 26188 }, { "epoch": 0.72, "learning_rate": 3.960624183196479e-06, "loss": 1.3064, "step": 26189 }, { "epoch": 0.72, "learning_rate": 3.95991922662309e-06, "loss": 1.3977, "step": 26190 }, { "epoch": 0.72, "learning_rate": 3.959214317304449e-06, "loss": 1.2998, "step": 26191 }, { "epoch": 0.72, "learning_rate": 3.958509455246079e-06, "loss": 1.3035, "step": 26192 }, { "epoch": 0.72, "learning_rate": 3.95780464045349e-06, "loss": 1.355, "step": 26193 }, { "epoch": 0.72, "learning_rate": 3.9570998729321955e-06, "loss": 1.2546, "step": 26194 }, { "epoch": 0.72, "learning_rate": 3.956395152687706e-06, "loss": 1.7793, "step": 26195 }, { "epoch": 0.72, "learning_rate": 3.9556904797255404e-06, "loss": 1.3242, "step": 26196 }, { "epoch": 0.72, "learning_rate": 3.954985854051217e-06, "loss": 1.1857, "step": 26197 }, { "epoch": 0.72, "learning_rate": 3.954281275670235e-06, "loss": 1.1943, "step": 26198 }, { "epoch": 0.72, "learning_rate": 3.953576744588115e-06, "loss": 1.2432, "step": 26199 }, { "epoch": 0.72, "learning_rate": 3.952872260810365e-06, "loss": 1.2346, "step": 26200 }, { "epoch": 0.72, "learning_rate": 3.9521678243425065e-06, "loss": 1.1428, "step": 26201 }, { "epoch": 0.72, "learning_rate": 3.951463435190035e-06, "loss": 1.2415, "step": 26202 }, { "epoch": 0.72, "learning_rate": 3.950759093358474e-06, "loss": 1.3188, "step": 26203 }, { "epoch": 0.72, "learning_rate": 3.950054798853324e-06, "loss": 0.9637, "step": 26204 }, { "epoch": 0.72, "learning_rate": 3.949350551680109e-06, "loss": 1.1882, "step": 26205 }, { "epoch": 0.72, "learning_rate": 3.948646351844323e-06, "loss": 1.3264, "step": 26206 }, { "epoch": 0.72, "learning_rate": 3.947942199351486e-06, "loss": 1.1682, "step": 26207 }, { "epoch": 0.72, "learning_rate": 3.947238094207098e-06, "loss": 1.231, "step": 26208 }, { "epoch": 0.72, "learning_rate": 3.946534036416682e-06, "loss": 1.3179, "step": 26209 }, { "epoch": 0.72, "learning_rate": 3.94583002598573e-06, "loss": 1.1877, "step": 26210 }, { "epoch": 0.72, "learning_rate": 3.945126062919756e-06, "loss": 1.2778, "step": 26211 }, { "epoch": 0.72, "learning_rate": 3.944422147224273e-06, "loss": 1.1992, "step": 26212 }, { "epoch": 0.72, "learning_rate": 3.9437182789047824e-06, "loss": 1.1372, "step": 26213 }, { "epoch": 0.72, "learning_rate": 3.943014457966793e-06, "loss": 1.3469, "step": 26214 }, { "epoch": 0.72, "learning_rate": 3.9423106844158065e-06, "loss": 1.2642, "step": 26215 }, { "epoch": 0.72, "learning_rate": 3.941606958257336e-06, "loss": 1.3181, "step": 26216 }, { "epoch": 0.72, "learning_rate": 3.9409032794968835e-06, "loss": 1.0911, "step": 26217 }, { "epoch": 0.72, "learning_rate": 3.9401996481399565e-06, "loss": 1.1246, "step": 26218 }, { "epoch": 0.72, "learning_rate": 3.939496064192052e-06, "loss": 1.1182, "step": 26219 }, { "epoch": 0.72, "learning_rate": 3.938792527658686e-06, "loss": 1.4114, "step": 26220 }, { "epoch": 0.72, "learning_rate": 3.938089038545355e-06, "loss": 1.2773, "step": 26221 }, { "epoch": 0.72, "learning_rate": 3.937385596857565e-06, "loss": 1.303, "step": 26222 }, { "epoch": 0.72, "learning_rate": 3.936682202600818e-06, "loss": 1.1494, "step": 26223 }, { "epoch": 0.72, "learning_rate": 3.93597885578062e-06, "loss": 1.3384, "step": 26224 }, { "epoch": 0.72, "learning_rate": 3.935275556402473e-06, "loss": 1.2625, "step": 26225 }, { "epoch": 0.72, "learning_rate": 3.934572304471874e-06, "loss": 1.2856, "step": 26226 }, { "epoch": 0.72, "learning_rate": 3.9338690999943315e-06, "loss": 1.2339, "step": 26227 }, { "epoch": 0.72, "learning_rate": 3.933165942975347e-06, "loss": 1.1853, "step": 26228 }, { "epoch": 0.72, "learning_rate": 3.932462833420418e-06, "loss": 1.2224, "step": 26229 }, { "epoch": 0.72, "learning_rate": 3.931759771335043e-06, "loss": 1.2236, "step": 26230 }, { "epoch": 0.72, "learning_rate": 3.9310567567247305e-06, "loss": 1.2378, "step": 26231 }, { "epoch": 0.72, "learning_rate": 3.930353789594975e-06, "loss": 1.2556, "step": 26232 }, { "epoch": 0.72, "learning_rate": 3.929650869951278e-06, "loss": 1.3428, "step": 26233 }, { "epoch": 0.72, "learning_rate": 3.928947997799134e-06, "loss": 1.2271, "step": 26234 }, { "epoch": 0.72, "learning_rate": 3.928245173144051e-06, "loss": 1.1367, "step": 26235 }, { "epoch": 0.72, "learning_rate": 3.9275423959915205e-06, "loss": 1.2366, "step": 26236 }, { "epoch": 0.72, "learning_rate": 3.9268396663470446e-06, "loss": 1.229, "step": 26237 }, { "epoch": 0.72, "learning_rate": 3.926136984216114e-06, "loss": 1.3364, "step": 26238 }, { "epoch": 0.72, "learning_rate": 3.925434349604237e-06, "loss": 1.2512, "step": 26239 }, { "epoch": 0.72, "learning_rate": 3.924731762516905e-06, "loss": 1.3745, "step": 26240 }, { "epoch": 0.72, "learning_rate": 3.92402922295961e-06, "loss": 1.1538, "step": 26241 }, { "epoch": 0.72, "learning_rate": 3.923326730937857e-06, "loss": 1.2717, "step": 26242 }, { "epoch": 0.72, "learning_rate": 3.922624286457137e-06, "loss": 0.9674, "step": 26243 }, { "epoch": 0.72, "learning_rate": 3.92192188952295e-06, "loss": 1.2227, "step": 26244 }, { "epoch": 0.72, "learning_rate": 3.921219540140784e-06, "loss": 1.3806, "step": 26245 }, { "epoch": 0.72, "learning_rate": 3.920517238316141e-06, "loss": 1.292, "step": 26246 }, { "epoch": 0.72, "learning_rate": 3.919814984054508e-06, "loss": 1.2137, "step": 26247 }, { "epoch": 0.72, "learning_rate": 3.91911277736139e-06, "loss": 1.342, "step": 26248 }, { "epoch": 0.72, "learning_rate": 3.918410618242269e-06, "loss": 1.2949, "step": 26249 }, { "epoch": 0.72, "learning_rate": 3.917708506702645e-06, "loss": 1.2412, "step": 26250 }, { "epoch": 0.72, "learning_rate": 3.917006442748007e-06, "loss": 1.2402, "step": 26251 }, { "epoch": 0.72, "learning_rate": 3.916304426383858e-06, "loss": 1.3982, "step": 26252 }, { "epoch": 0.72, "learning_rate": 3.915602457615674e-06, "loss": 1.2373, "step": 26253 }, { "epoch": 0.72, "learning_rate": 3.914900536448959e-06, "loss": 1.4282, "step": 26254 }, { "epoch": 0.72, "learning_rate": 3.914198662889198e-06, "loss": 1.2112, "step": 26255 }, { "epoch": 0.72, "learning_rate": 3.913496836941888e-06, "loss": 1.092, "step": 26256 }, { "epoch": 0.72, "learning_rate": 3.912795058612517e-06, "loss": 1.162, "step": 26257 }, { "epoch": 0.72, "learning_rate": 3.912093327906571e-06, "loss": 1.2478, "step": 26258 }, { "epoch": 0.72, "learning_rate": 3.911391644829549e-06, "loss": 1.3188, "step": 26259 }, { "epoch": 0.72, "learning_rate": 3.910690009386934e-06, "loss": 1.166, "step": 26260 }, { "epoch": 0.72, "learning_rate": 3.909988421584217e-06, "loss": 1.3665, "step": 26261 }, { "epoch": 0.72, "learning_rate": 3.9092868814268844e-06, "loss": 1.3337, "step": 26262 }, { "epoch": 0.72, "learning_rate": 3.908585388920431e-06, "loss": 1.2825, "step": 26263 }, { "epoch": 0.72, "learning_rate": 3.90788394407034e-06, "loss": 1.2666, "step": 26264 }, { "epoch": 0.72, "learning_rate": 3.9071825468821e-06, "loss": 1.2727, "step": 26265 }, { "epoch": 0.72, "learning_rate": 3.906481197361196e-06, "loss": 1.4199, "step": 26266 }, { "epoch": 0.72, "learning_rate": 3.905779895513121e-06, "loss": 1.2146, "step": 26267 }, { "epoch": 0.72, "learning_rate": 3.905078641343358e-06, "loss": 1.1797, "step": 26268 }, { "epoch": 0.72, "learning_rate": 3.904377434857395e-06, "loss": 1.2812, "step": 26269 }, { "epoch": 0.72, "learning_rate": 3.903676276060711e-06, "loss": 1.2358, "step": 26270 }, { "epoch": 0.72, "learning_rate": 3.902975164958803e-06, "loss": 1.2874, "step": 26271 }, { "epoch": 0.72, "learning_rate": 3.9022741015571485e-06, "loss": 1.1978, "step": 26272 }, { "epoch": 0.72, "learning_rate": 3.901573085861232e-06, "loss": 1.7124, "step": 26273 }, { "epoch": 0.72, "learning_rate": 3.900872117876543e-06, "loss": 1.2715, "step": 26274 }, { "epoch": 0.72, "learning_rate": 3.900171197608562e-06, "loss": 1.2258, "step": 26275 }, { "epoch": 0.72, "learning_rate": 3.899470325062773e-06, "loss": 1.3481, "step": 26276 }, { "epoch": 0.72, "learning_rate": 3.898769500244657e-06, "loss": 1.3501, "step": 26277 }, { "epoch": 0.72, "learning_rate": 3.898068723159702e-06, "loss": 1.3862, "step": 26278 }, { "epoch": 0.72, "learning_rate": 3.897367993813389e-06, "loss": 1.1465, "step": 26279 }, { "epoch": 0.72, "learning_rate": 3.896667312211199e-06, "loss": 1.0759, "step": 26280 }, { "epoch": 0.72, "learning_rate": 3.895966678358609e-06, "loss": 1.1349, "step": 26281 }, { "epoch": 0.72, "learning_rate": 3.895266092261111e-06, "loss": 1.356, "step": 26282 }, { "epoch": 0.72, "learning_rate": 3.894565553924179e-06, "loss": 1.2942, "step": 26283 }, { "epoch": 0.72, "learning_rate": 3.893865063353295e-06, "loss": 1.2754, "step": 26284 }, { "epoch": 0.72, "learning_rate": 3.893164620553936e-06, "loss": 1.3638, "step": 26285 }, { "epoch": 0.72, "learning_rate": 3.89246422553159e-06, "loss": 1.1152, "step": 26286 }, { "epoch": 0.72, "learning_rate": 3.891763878291728e-06, "loss": 1.3794, "step": 26287 }, { "epoch": 0.72, "learning_rate": 3.891063578839835e-06, "loss": 1.238, "step": 26288 }, { "epoch": 0.72, "learning_rate": 3.89036332718139e-06, "loss": 1.0881, "step": 26289 }, { "epoch": 0.72, "learning_rate": 3.889663123321865e-06, "loss": 1.3616, "step": 26290 }, { "epoch": 0.72, "learning_rate": 3.888962967266746e-06, "loss": 1.2444, "step": 26291 }, { "epoch": 0.72, "learning_rate": 3.888262859021508e-06, "loss": 1.2717, "step": 26292 }, { "epoch": 0.72, "learning_rate": 3.887562798591626e-06, "loss": 1.2615, "step": 26293 }, { "epoch": 0.72, "learning_rate": 3.886862785982576e-06, "loss": 1.2097, "step": 26294 }, { "epoch": 0.72, "learning_rate": 3.88616282119984e-06, "loss": 1.2083, "step": 26295 }, { "epoch": 0.72, "learning_rate": 3.885462904248891e-06, "loss": 1.1826, "step": 26296 }, { "epoch": 0.72, "learning_rate": 3.884763035135205e-06, "loss": 1.2117, "step": 26297 }, { "epoch": 0.72, "learning_rate": 3.884063213864254e-06, "loss": 1.1667, "step": 26298 }, { "epoch": 0.72, "learning_rate": 3.883363440441521e-06, "loss": 1.3293, "step": 26299 }, { "epoch": 0.72, "learning_rate": 3.882663714872474e-06, "loss": 1.2454, "step": 26300 }, { "epoch": 0.72, "learning_rate": 3.881964037162592e-06, "loss": 1.2637, "step": 26301 }, { "epoch": 0.72, "learning_rate": 3.8812644073173415e-06, "loss": 1.0615, "step": 26302 }, { "epoch": 0.72, "learning_rate": 3.880564825342204e-06, "loss": 1.2976, "step": 26303 }, { "epoch": 0.72, "learning_rate": 3.8798652912426515e-06, "loss": 1.1648, "step": 26304 }, { "epoch": 0.72, "learning_rate": 3.879165805024151e-06, "loss": 1.2576, "step": 26305 }, { "epoch": 0.72, "learning_rate": 3.878466366692182e-06, "loss": 1.321, "step": 26306 }, { "epoch": 0.72, "learning_rate": 3.877766976252214e-06, "loss": 1.2244, "step": 26307 }, { "epoch": 0.72, "learning_rate": 3.877067633709718e-06, "loss": 1.2261, "step": 26308 }, { "epoch": 0.72, "learning_rate": 3.876368339070163e-06, "loss": 1.321, "step": 26309 }, { "epoch": 0.72, "learning_rate": 3.875669092339024e-06, "loss": 1.2627, "step": 26310 }, { "epoch": 0.72, "learning_rate": 3.8749698935217716e-06, "loss": 1.3025, "step": 26311 }, { "epoch": 0.72, "learning_rate": 3.874270742623875e-06, "loss": 1.2278, "step": 26312 }, { "epoch": 0.72, "learning_rate": 3.8735716396508e-06, "loss": 1.2177, "step": 26313 }, { "epoch": 0.72, "learning_rate": 3.872872584608022e-06, "loss": 1.1436, "step": 26314 }, { "epoch": 0.72, "learning_rate": 3.872173577501008e-06, "loss": 1.241, "step": 26315 }, { "epoch": 0.72, "learning_rate": 3.871474618335227e-06, "loss": 1.1836, "step": 26316 }, { "epoch": 0.72, "learning_rate": 3.870775707116143e-06, "loss": 1.4888, "step": 26317 }, { "epoch": 0.72, "learning_rate": 3.8700768438492305e-06, "loss": 1.2334, "step": 26318 }, { "epoch": 0.72, "learning_rate": 3.869378028539955e-06, "loss": 1.2137, "step": 26319 }, { "epoch": 0.72, "learning_rate": 3.86867926119378e-06, "loss": 1.2627, "step": 26320 }, { "epoch": 0.72, "learning_rate": 3.867980541816179e-06, "loss": 1.3657, "step": 26321 }, { "epoch": 0.72, "learning_rate": 3.86728187041261e-06, "loss": 1.4045, "step": 26322 }, { "epoch": 0.72, "learning_rate": 3.866583246988551e-06, "loss": 1.2632, "step": 26323 }, { "epoch": 0.72, "learning_rate": 3.865884671549455e-06, "loss": 1.1245, "step": 26324 }, { "epoch": 0.72, "learning_rate": 3.865186144100794e-06, "loss": 1.2744, "step": 26325 }, { "epoch": 0.72, "learning_rate": 3.86448766464803e-06, "loss": 1.2236, "step": 26326 }, { "epoch": 0.72, "learning_rate": 3.8637892331966366e-06, "loss": 1.3862, "step": 26327 }, { "epoch": 0.72, "learning_rate": 3.863090849752062e-06, "loss": 1.3464, "step": 26328 }, { "epoch": 0.72, "learning_rate": 3.862392514319785e-06, "loss": 1.3796, "step": 26329 }, { "epoch": 0.72, "learning_rate": 3.861694226905257e-06, "loss": 1.4534, "step": 26330 }, { "epoch": 0.72, "learning_rate": 3.860995987513956e-06, "loss": 1.1995, "step": 26331 }, { "epoch": 0.72, "learning_rate": 3.860297796151327e-06, "loss": 1.2434, "step": 26332 }, { "epoch": 0.72, "learning_rate": 3.859599652822845e-06, "loss": 1.2778, "step": 26333 }, { "epoch": 0.72, "learning_rate": 3.858901557533964e-06, "loss": 1.0291, "step": 26334 }, { "epoch": 0.72, "learning_rate": 3.858203510290154e-06, "loss": 1.1868, "step": 26335 }, { "epoch": 0.72, "learning_rate": 3.857505511096871e-06, "loss": 1.281, "step": 26336 }, { "epoch": 0.72, "learning_rate": 3.856807559959572e-06, "loss": 1.314, "step": 26337 }, { "epoch": 0.72, "learning_rate": 3.856109656883726e-06, "loss": 1.2656, "step": 26338 }, { "epoch": 0.72, "learning_rate": 3.85541180187479e-06, "loss": 1.6616, "step": 26339 }, { "epoch": 0.72, "learning_rate": 3.854713994938221e-06, "loss": 1.0845, "step": 26340 }, { "epoch": 0.72, "learning_rate": 3.854016236079479e-06, "loss": 1.2874, "step": 26341 }, { "epoch": 0.72, "learning_rate": 3.853318525304025e-06, "loss": 1.3667, "step": 26342 }, { "epoch": 0.72, "learning_rate": 3.8526208626173174e-06, "loss": 1.0684, "step": 26343 }, { "epoch": 0.72, "learning_rate": 3.851923248024814e-06, "loss": 1.0425, "step": 26344 }, { "epoch": 0.72, "learning_rate": 3.851225681531968e-06, "loss": 1.2642, "step": 26345 }, { "epoch": 0.72, "learning_rate": 3.850528163144243e-06, "loss": 1.26, "step": 26346 }, { "epoch": 0.72, "learning_rate": 3.849830692867097e-06, "loss": 1.2371, "step": 26347 }, { "epoch": 0.72, "learning_rate": 3.8491332707059815e-06, "loss": 1.1099, "step": 26348 }, { "epoch": 0.72, "learning_rate": 3.848435896666352e-06, "loss": 1.3352, "step": 26349 }, { "epoch": 0.72, "learning_rate": 3.847738570753671e-06, "loss": 1.1799, "step": 26350 }, { "epoch": 0.72, "learning_rate": 3.84704129297339e-06, "loss": 1.1445, "step": 26351 }, { "epoch": 0.72, "learning_rate": 3.846344063330961e-06, "loss": 1.2808, "step": 26352 }, { "epoch": 0.72, "learning_rate": 3.845646881831847e-06, "loss": 1.1763, "step": 26353 }, { "epoch": 0.72, "learning_rate": 3.844949748481497e-06, "loss": 1.2622, "step": 26354 }, { "epoch": 0.72, "learning_rate": 3.844252663285366e-06, "loss": 1.1726, "step": 26355 }, { "epoch": 0.72, "learning_rate": 3.843555626248904e-06, "loss": 1.3535, "step": 26356 }, { "epoch": 0.72, "learning_rate": 3.842858637377571e-06, "loss": 1.2461, "step": 26357 }, { "epoch": 0.72, "learning_rate": 3.842161696676817e-06, "loss": 1.4038, "step": 26358 }, { "epoch": 0.72, "learning_rate": 3.841464804152095e-06, "loss": 1.3364, "step": 26359 }, { "epoch": 0.72, "learning_rate": 3.840767959808852e-06, "loss": 1.2271, "step": 26360 }, { "epoch": 0.72, "learning_rate": 3.840071163652548e-06, "loss": 1.3975, "step": 26361 }, { "epoch": 0.72, "learning_rate": 3.83937441568863e-06, "loss": 1.2964, "step": 26362 }, { "epoch": 0.72, "learning_rate": 3.838677715922551e-06, "loss": 1.3154, "step": 26363 }, { "epoch": 0.72, "learning_rate": 3.837981064359756e-06, "loss": 1.2268, "step": 26364 }, { "epoch": 0.72, "learning_rate": 3.837284461005699e-06, "loss": 1.1135, "step": 26365 }, { "epoch": 0.72, "learning_rate": 3.836587905865838e-06, "loss": 1.2771, "step": 26366 }, { "epoch": 0.72, "learning_rate": 3.8358913989456084e-06, "loss": 1.165, "step": 26367 }, { "epoch": 0.72, "learning_rate": 3.835194940250469e-06, "loss": 1.2949, "step": 26368 }, { "epoch": 0.72, "learning_rate": 3.834498529785863e-06, "loss": 1.2861, "step": 26369 }, { "epoch": 0.72, "learning_rate": 3.833802167557246e-06, "loss": 1.2048, "step": 26370 }, { "epoch": 0.72, "learning_rate": 3.833105853570056e-06, "loss": 1.1985, "step": 26371 }, { "epoch": 0.72, "learning_rate": 3.832409587829749e-06, "loss": 1.2675, "step": 26372 }, { "epoch": 0.72, "learning_rate": 3.831713370341766e-06, "loss": 1.7437, "step": 26373 }, { "epoch": 0.72, "learning_rate": 3.831017201111565e-06, "loss": 1.2327, "step": 26374 }, { "epoch": 0.72, "learning_rate": 3.830321080144576e-06, "loss": 1.2244, "step": 26375 }, { "epoch": 0.72, "learning_rate": 3.829625007446257e-06, "loss": 1.1377, "step": 26376 }, { "epoch": 0.72, "learning_rate": 3.828928983022046e-06, "loss": 1.3994, "step": 26377 }, { "epoch": 0.72, "learning_rate": 3.828233006877402e-06, "loss": 1.3201, "step": 26378 }, { "epoch": 0.72, "learning_rate": 3.8275370790177535e-06, "loss": 1.2485, "step": 26379 }, { "epoch": 0.72, "learning_rate": 3.826841199448555e-06, "loss": 1.1904, "step": 26380 }, { "epoch": 0.72, "learning_rate": 3.826145368175245e-06, "loss": 1.3665, "step": 26381 }, { "epoch": 0.72, "learning_rate": 3.825449585203275e-06, "loss": 1.2239, "step": 26382 }, { "epoch": 0.72, "learning_rate": 3.824753850538082e-06, "loss": 1.0806, "step": 26383 }, { "epoch": 0.72, "learning_rate": 3.8240581641851095e-06, "loss": 1.2627, "step": 26384 }, { "epoch": 0.72, "learning_rate": 3.823362526149804e-06, "loss": 1.0781, "step": 26385 }, { "epoch": 0.72, "learning_rate": 3.822666936437605e-06, "loss": 1.3271, "step": 26386 }, { "epoch": 0.72, "learning_rate": 3.821971395053957e-06, "loss": 1.3042, "step": 26387 }, { "epoch": 0.72, "learning_rate": 3.8212759020042955e-06, "loss": 1.1638, "step": 26388 }, { "epoch": 0.72, "learning_rate": 3.820580457294069e-06, "loss": 1.2847, "step": 26389 }, { "epoch": 0.72, "learning_rate": 3.819885060928715e-06, "loss": 1.4397, "step": 26390 }, { "epoch": 0.72, "learning_rate": 3.819189712913675e-06, "loss": 1.3381, "step": 26391 }, { "epoch": 0.72, "learning_rate": 3.818494413254384e-06, "loss": 1.3787, "step": 26392 }, { "epoch": 0.72, "learning_rate": 3.817799161956291e-06, "loss": 1.2422, "step": 26393 }, { "epoch": 0.72, "learning_rate": 3.817103959024828e-06, "loss": 1.3552, "step": 26394 }, { "epoch": 0.72, "learning_rate": 3.816408804465438e-06, "loss": 1.1294, "step": 26395 }, { "epoch": 0.72, "learning_rate": 3.815713698283553e-06, "loss": 1.3748, "step": 26396 }, { "epoch": 0.72, "learning_rate": 3.81501864048462e-06, "loss": 1.4365, "step": 26397 }, { "epoch": 0.72, "learning_rate": 3.8143236310740738e-06, "loss": 1.1821, "step": 26398 }, { "epoch": 0.72, "learning_rate": 3.8136286700573456e-06, "loss": 1.2832, "step": 26399 }, { "epoch": 0.72, "learning_rate": 3.8129337574398827e-06, "loss": 1.2007, "step": 26400 }, { "epoch": 0.72, "learning_rate": 3.812238893227116e-06, "loss": 1.2759, "step": 26401 }, { "epoch": 0.72, "learning_rate": 3.8115440774244816e-06, "loss": 1.3745, "step": 26402 }, { "epoch": 0.72, "learning_rate": 3.8108493100374142e-06, "loss": 1.1541, "step": 26403 }, { "epoch": 0.72, "learning_rate": 3.8101545910713546e-06, "loss": 1.3943, "step": 26404 }, { "epoch": 0.72, "learning_rate": 3.809459920531734e-06, "loss": 1.2761, "step": 26405 }, { "epoch": 0.72, "learning_rate": 3.8087652984239887e-06, "loss": 1.2056, "step": 26406 }, { "epoch": 0.72, "learning_rate": 3.8080707247535486e-06, "loss": 1.2148, "step": 26407 }, { "epoch": 0.72, "learning_rate": 3.807376199525856e-06, "loss": 1.1794, "step": 26408 }, { "epoch": 0.72, "learning_rate": 3.8066817227463392e-06, "loss": 1.3411, "step": 26409 }, { "epoch": 0.72, "learning_rate": 3.8059872944204324e-06, "loss": 1.271, "step": 26410 }, { "epoch": 0.72, "learning_rate": 3.8052929145535646e-06, "loss": 1.3193, "step": 26411 }, { "epoch": 0.72, "learning_rate": 3.804598583151172e-06, "loss": 1.3123, "step": 26412 }, { "epoch": 0.72, "learning_rate": 3.8039043002186946e-06, "loss": 1.2432, "step": 26413 }, { "epoch": 0.72, "learning_rate": 3.803210065761549e-06, "loss": 1.3621, "step": 26414 }, { "epoch": 0.72, "learning_rate": 3.802515879785177e-06, "loss": 1.3003, "step": 26415 }, { "epoch": 0.72, "learning_rate": 3.8018217422950034e-06, "loss": 1.1963, "step": 26416 }, { "epoch": 0.72, "learning_rate": 3.8011276532964693e-06, "loss": 1.4009, "step": 26417 }, { "epoch": 0.72, "learning_rate": 3.800433612794989e-06, "loss": 1.218, "step": 26418 }, { "epoch": 0.72, "learning_rate": 3.799739620796006e-06, "loss": 1.3125, "step": 26419 }, { "epoch": 0.72, "learning_rate": 3.79904567730494e-06, "loss": 1.2832, "step": 26420 }, { "epoch": 0.72, "learning_rate": 3.798351782327232e-06, "loss": 1.2664, "step": 26421 }, { "epoch": 0.72, "learning_rate": 3.7976579358682973e-06, "loss": 1.3, "step": 26422 }, { "epoch": 0.72, "learning_rate": 3.796964137933573e-06, "loss": 1.1833, "step": 26423 }, { "epoch": 0.72, "learning_rate": 3.7962703885284813e-06, "loss": 1.2886, "step": 26424 }, { "epoch": 0.72, "learning_rate": 3.79557668765846e-06, "loss": 1.0901, "step": 26425 }, { "epoch": 0.72, "learning_rate": 3.7948830353289214e-06, "loss": 1.1638, "step": 26426 }, { "epoch": 0.72, "learning_rate": 3.794189431545301e-06, "loss": 1.3796, "step": 26427 }, { "epoch": 0.72, "learning_rate": 3.793495876313027e-06, "loss": 1.1897, "step": 26428 }, { "epoch": 0.72, "learning_rate": 3.7928023696375227e-06, "loss": 1.2104, "step": 26429 }, { "epoch": 0.72, "learning_rate": 3.792108911524215e-06, "loss": 0.9666, "step": 26430 }, { "epoch": 0.72, "learning_rate": 3.791415501978524e-06, "loss": 1.1108, "step": 26431 }, { "epoch": 0.72, "learning_rate": 3.7907221410058815e-06, "loss": 1.1799, "step": 26432 }, { "epoch": 0.72, "learning_rate": 3.790028828611709e-06, "loss": 1.2578, "step": 26433 }, { "epoch": 0.72, "learning_rate": 3.789335564801432e-06, "loss": 1.1526, "step": 26434 }, { "epoch": 0.72, "learning_rate": 3.7886423495804694e-06, "loss": 1.2769, "step": 26435 }, { "epoch": 0.72, "learning_rate": 3.7879491829542513e-06, "loss": 1.3657, "step": 26436 }, { "epoch": 0.72, "learning_rate": 3.7872560649281973e-06, "loss": 1.3337, "step": 26437 }, { "epoch": 0.72, "learning_rate": 3.786562995507731e-06, "loss": 1.3025, "step": 26438 }, { "epoch": 0.72, "learning_rate": 3.785869974698271e-06, "loss": 1.1899, "step": 26439 }, { "epoch": 0.72, "learning_rate": 3.785177002505245e-06, "loss": 1.3074, "step": 26440 }, { "epoch": 0.72, "learning_rate": 3.784484078934071e-06, "loss": 1.1382, "step": 26441 }, { "epoch": 0.72, "learning_rate": 3.7837912039901727e-06, "loss": 1.323, "step": 26442 }, { "epoch": 0.72, "learning_rate": 3.7830983776789644e-06, "loss": 1.23, "step": 26443 }, { "epoch": 0.72, "learning_rate": 3.782405600005874e-06, "loss": 1.1987, "step": 26444 }, { "epoch": 0.72, "learning_rate": 3.7817128709763186e-06, "loss": 1.4543, "step": 26445 }, { "epoch": 0.72, "learning_rate": 3.7810201905957145e-06, "loss": 1.4297, "step": 26446 }, { "epoch": 0.72, "learning_rate": 3.7803275588694876e-06, "loss": 1.3333, "step": 26447 }, { "epoch": 0.72, "learning_rate": 3.779634975803054e-06, "loss": 1.2119, "step": 26448 }, { "epoch": 0.72, "learning_rate": 3.7789424414018304e-06, "loss": 1.2056, "step": 26449 }, { "epoch": 0.72, "learning_rate": 3.7782499556712314e-06, "loss": 1.4482, "step": 26450 }, { "epoch": 0.72, "learning_rate": 3.7775575186166848e-06, "loss": 1.2585, "step": 26451 }, { "epoch": 0.72, "learning_rate": 3.7768651302436e-06, "loss": 1.2773, "step": 26452 }, { "epoch": 0.72, "learning_rate": 3.7761727905573974e-06, "loss": 1.2532, "step": 26453 }, { "epoch": 0.72, "learning_rate": 3.7754804995634884e-06, "loss": 1.2534, "step": 26454 }, { "epoch": 0.72, "learning_rate": 3.774788257267297e-06, "loss": 1.2219, "step": 26455 }, { "epoch": 0.72, "learning_rate": 3.7740960636742342e-06, "loss": 1.1289, "step": 26456 }, { "epoch": 0.72, "learning_rate": 3.7734039187897165e-06, "loss": 1.1833, "step": 26457 }, { "epoch": 0.72, "learning_rate": 3.772711822619155e-06, "loss": 1.3623, "step": 26458 }, { "epoch": 0.72, "learning_rate": 3.772019775167968e-06, "loss": 1.3652, "step": 26459 }, { "epoch": 0.72, "learning_rate": 3.7713277764415767e-06, "loss": 1.396, "step": 26460 }, { "epoch": 0.72, "learning_rate": 3.77063582644538e-06, "loss": 1.0967, "step": 26461 }, { "epoch": 0.72, "learning_rate": 3.7699439251848045e-06, "loss": 1.0497, "step": 26462 }, { "epoch": 0.72, "learning_rate": 3.7692520726652536e-06, "loss": 1.2747, "step": 26463 }, { "epoch": 0.72, "learning_rate": 3.768560268892152e-06, "loss": 1.3596, "step": 26464 }, { "epoch": 0.72, "learning_rate": 3.7678685138708972e-06, "loss": 1.623, "step": 26465 }, { "epoch": 0.72, "learning_rate": 3.7671768076069126e-06, "loss": 1.2671, "step": 26466 }, { "epoch": 0.72, "learning_rate": 3.766485150105602e-06, "loss": 1.647, "step": 26467 }, { "epoch": 0.72, "learning_rate": 3.7657935413723876e-06, "loss": 1.2098, "step": 26468 }, { "epoch": 0.72, "learning_rate": 3.7651019814126656e-06, "loss": 1.2612, "step": 26469 }, { "epoch": 0.72, "learning_rate": 3.7644104702318575e-06, "loss": 1.113, "step": 26470 }, { "epoch": 0.72, "learning_rate": 3.763719007835367e-06, "loss": 1.2573, "step": 26471 }, { "epoch": 0.72, "learning_rate": 3.7630275942286122e-06, "loss": 1.1876, "step": 26472 }, { "epoch": 0.72, "learning_rate": 3.762336229416991e-06, "loss": 1.2683, "step": 26473 }, { "epoch": 0.72, "learning_rate": 3.7616449134059163e-06, "loss": 1.2122, "step": 26474 }, { "epoch": 0.72, "learning_rate": 3.7609536462008034e-06, "loss": 1.3638, "step": 26475 }, { "epoch": 0.72, "learning_rate": 3.7602624278070543e-06, "loss": 1.2424, "step": 26476 }, { "epoch": 0.72, "learning_rate": 3.759571258230078e-06, "loss": 1.2744, "step": 26477 }, { "epoch": 0.72, "learning_rate": 3.758880137475278e-06, "loss": 1.3625, "step": 26478 }, { "epoch": 0.72, "learning_rate": 3.758189065548069e-06, "loss": 1.24, "step": 26479 }, { "epoch": 0.72, "learning_rate": 3.757498042453854e-06, "loss": 1.1001, "step": 26480 }, { "epoch": 0.72, "learning_rate": 3.7568070681980384e-06, "loss": 1.2122, "step": 26481 }, { "epoch": 0.72, "learning_rate": 3.756116142786025e-06, "loss": 1.1271, "step": 26482 }, { "epoch": 0.72, "learning_rate": 3.755425266223227e-06, "loss": 1.3159, "step": 26483 }, { "epoch": 0.72, "learning_rate": 3.7547344385150443e-06, "loss": 1.2783, "step": 26484 }, { "epoch": 0.72, "learning_rate": 3.754043659666884e-06, "loss": 1.345, "step": 26485 }, { "epoch": 0.72, "learning_rate": 3.753352929684144e-06, "loss": 1.3689, "step": 26486 }, { "epoch": 0.72, "learning_rate": 3.7526622485722376e-06, "loss": 1.334, "step": 26487 }, { "epoch": 0.72, "learning_rate": 3.7519716163365637e-06, "loss": 1.2671, "step": 26488 }, { "epoch": 0.72, "learning_rate": 3.7512810329825224e-06, "loss": 1.1873, "step": 26489 }, { "epoch": 0.72, "learning_rate": 3.750590498515524e-06, "loss": 1.3838, "step": 26490 }, { "epoch": 0.72, "learning_rate": 3.749900012940966e-06, "loss": 1.217, "step": 26491 }, { "epoch": 0.72, "learning_rate": 3.7492095762642523e-06, "loss": 1.2646, "step": 26492 }, { "epoch": 0.72, "learning_rate": 3.748519188490779e-06, "loss": 1.2346, "step": 26493 }, { "epoch": 0.72, "learning_rate": 3.7478288496259564e-06, "loss": 1.3096, "step": 26494 }, { "epoch": 0.72, "learning_rate": 3.7471385596751796e-06, "loss": 1.2131, "step": 26495 }, { "epoch": 0.72, "learning_rate": 3.7464483186438517e-06, "loss": 1.2742, "step": 26496 }, { "epoch": 0.72, "learning_rate": 3.7457581265373676e-06, "loss": 1.2249, "step": 26497 }, { "epoch": 0.72, "learning_rate": 3.7450679833611346e-06, "loss": 1.0754, "step": 26498 }, { "epoch": 0.72, "learning_rate": 3.7443778891205483e-06, "loss": 1.3911, "step": 26499 }, { "epoch": 0.72, "learning_rate": 3.7436878438210077e-06, "loss": 1.3181, "step": 26500 }, { "epoch": 0.72, "learning_rate": 3.7429978474679073e-06, "loss": 1.3862, "step": 26501 }, { "epoch": 0.72, "learning_rate": 3.742307900066654e-06, "loss": 1.3491, "step": 26502 }, { "epoch": 0.72, "learning_rate": 3.741618001622641e-06, "loss": 1.1487, "step": 26503 }, { "epoch": 0.72, "learning_rate": 3.7409281521412653e-06, "loss": 1.2009, "step": 26504 }, { "epoch": 0.72, "learning_rate": 3.7402383516279217e-06, "loss": 1.3403, "step": 26505 }, { "epoch": 0.72, "learning_rate": 3.7395486000880097e-06, "loss": 1.3108, "step": 26506 }, { "epoch": 0.72, "learning_rate": 3.7388588975269326e-06, "loss": 1.2456, "step": 26507 }, { "epoch": 0.72, "learning_rate": 3.7381692439500715e-06, "loss": 1.4053, "step": 26508 }, { "epoch": 0.72, "learning_rate": 3.737479639362833e-06, "loss": 1.3823, "step": 26509 }, { "epoch": 0.72, "learning_rate": 3.7367900837706074e-06, "loss": 1.3159, "step": 26510 }, { "epoch": 0.72, "learning_rate": 3.7361005771787964e-06, "loss": 1.4543, "step": 26511 }, { "epoch": 0.72, "learning_rate": 3.735411119592782e-06, "loss": 1.3176, "step": 26512 }, { "epoch": 0.72, "learning_rate": 3.734721711017969e-06, "loss": 1.1646, "step": 26513 }, { "epoch": 0.72, "learning_rate": 3.7340323514597444e-06, "loss": 1.3584, "step": 26514 }, { "epoch": 0.72, "learning_rate": 3.7333430409235105e-06, "loss": 1.0173, "step": 26515 }, { "epoch": 0.72, "learning_rate": 3.7326537794146468e-06, "loss": 1.3669, "step": 26516 }, { "epoch": 0.72, "learning_rate": 3.731964566938556e-06, "loss": 1.2192, "step": 26517 }, { "epoch": 0.72, "learning_rate": 3.731275403500624e-06, "loss": 1.2896, "step": 26518 }, { "epoch": 0.72, "learning_rate": 3.7305862891062485e-06, "loss": 1.3167, "step": 26519 }, { "epoch": 0.72, "learning_rate": 3.729897223760819e-06, "loss": 1.291, "step": 26520 }, { "epoch": 0.72, "learning_rate": 3.72920820746972e-06, "loss": 1.2891, "step": 26521 }, { "epoch": 0.72, "learning_rate": 3.728519240238352e-06, "loss": 1.3005, "step": 26522 }, { "epoch": 0.72, "learning_rate": 3.7278303220721e-06, "loss": 1.1646, "step": 26523 }, { "epoch": 0.72, "learning_rate": 3.727141452976354e-06, "loss": 1.0999, "step": 26524 }, { "epoch": 0.72, "learning_rate": 3.726452632956501e-06, "loss": 1.3462, "step": 26525 }, { "epoch": 0.72, "learning_rate": 3.725763862017935e-06, "loss": 1.136, "step": 26526 }, { "epoch": 0.72, "learning_rate": 3.7250751401660423e-06, "loss": 1.0974, "step": 26527 }, { "epoch": 0.72, "learning_rate": 3.724386467406211e-06, "loss": 1.2332, "step": 26528 }, { "epoch": 0.72, "learning_rate": 3.7236978437438266e-06, "loss": 1.0573, "step": 26529 }, { "epoch": 0.72, "learning_rate": 3.723009269184281e-06, "loss": 1.3315, "step": 26530 }, { "epoch": 0.72, "learning_rate": 3.72232074373296e-06, "loss": 1.3059, "step": 26531 }, { "epoch": 0.72, "learning_rate": 3.72163226739525e-06, "loss": 1.2495, "step": 26532 }, { "epoch": 0.72, "learning_rate": 3.720943840176532e-06, "loss": 1.2292, "step": 26533 }, { "epoch": 0.72, "learning_rate": 3.7202554620822005e-06, "loss": 1.3052, "step": 26534 }, { "epoch": 0.72, "learning_rate": 3.7195671331176385e-06, "loss": 1.2488, "step": 26535 }, { "epoch": 0.72, "learning_rate": 3.7188788532882258e-06, "loss": 1.1638, "step": 26536 }, { "epoch": 0.72, "learning_rate": 3.718190622599355e-06, "loss": 1.199, "step": 26537 }, { "epoch": 0.72, "learning_rate": 3.7175024410564063e-06, "loss": 1.167, "step": 26538 }, { "epoch": 0.72, "learning_rate": 3.7168143086647645e-06, "loss": 1.3145, "step": 26539 }, { "epoch": 0.72, "learning_rate": 3.7161262254298104e-06, "loss": 1.2886, "step": 26540 }, { "epoch": 0.72, "learning_rate": 3.7154381913569327e-06, "loss": 1.2217, "step": 26541 }, { "epoch": 0.72, "learning_rate": 3.7147502064515105e-06, "loss": 1.3906, "step": 26542 }, { "epoch": 0.72, "learning_rate": 3.714062270718928e-06, "loss": 1.1465, "step": 26543 }, { "epoch": 0.72, "learning_rate": 3.713374384164563e-06, "loss": 1.3167, "step": 26544 }, { "epoch": 0.72, "learning_rate": 3.7126865467938043e-06, "loss": 1.1365, "step": 26545 }, { "epoch": 0.72, "learning_rate": 3.711998758612029e-06, "loss": 1.2754, "step": 26546 }, { "epoch": 0.72, "learning_rate": 3.7113110196246184e-06, "loss": 1.2109, "step": 26547 }, { "epoch": 0.73, "learning_rate": 3.710623329836951e-06, "loss": 1.1289, "step": 26548 }, { "epoch": 0.73, "learning_rate": 3.7099356892544114e-06, "loss": 1.3196, "step": 26549 }, { "epoch": 0.73, "learning_rate": 3.709248097882374e-06, "loss": 1.1316, "step": 26550 }, { "epoch": 0.73, "learning_rate": 3.708560555726225e-06, "loss": 1.3564, "step": 26551 }, { "epoch": 0.73, "learning_rate": 3.7078730627913397e-06, "loss": 1.2209, "step": 26552 }, { "epoch": 0.73, "learning_rate": 3.7071856190830934e-06, "loss": 1.2651, "step": 26553 }, { "epoch": 0.73, "learning_rate": 3.7064982246068715e-06, "loss": 1.2139, "step": 26554 }, { "epoch": 0.73, "learning_rate": 3.7058108793680467e-06, "loss": 1.2903, "step": 26555 }, { "epoch": 0.73, "learning_rate": 3.705123583372e-06, "loss": 1.0544, "step": 26556 }, { "epoch": 0.73, "learning_rate": 3.704436336624101e-06, "loss": 1.1367, "step": 26557 }, { "epoch": 0.73, "learning_rate": 3.7037491391297365e-06, "loss": 1.2046, "step": 26558 }, { "epoch": 0.73, "learning_rate": 3.7030619908942776e-06, "loss": 1.2937, "step": 26559 }, { "epoch": 0.73, "learning_rate": 3.7023748919231007e-06, "loss": 1.145, "step": 26560 }, { "epoch": 0.73, "learning_rate": 3.7016878422215773e-06, "loss": 1.3491, "step": 26561 }, { "epoch": 0.73, "learning_rate": 3.7010008417950906e-06, "loss": 1.3704, "step": 26562 }, { "epoch": 0.73, "learning_rate": 3.700313890649011e-06, "loss": 1.2258, "step": 26563 }, { "epoch": 0.73, "learning_rate": 3.699626988788713e-06, "loss": 1.313, "step": 26564 }, { "epoch": 0.73, "learning_rate": 3.6989401362195676e-06, "loss": 1.3601, "step": 26565 }, { "epoch": 0.73, "learning_rate": 3.698253332946955e-06, "loss": 1.2244, "step": 26566 }, { "epoch": 0.73, "learning_rate": 3.697566578976245e-06, "loss": 1.0835, "step": 26567 }, { "epoch": 0.73, "learning_rate": 3.6968798743128078e-06, "loss": 1.2944, "step": 26568 }, { "epoch": 0.73, "learning_rate": 3.6961932189620207e-06, "loss": 1.1973, "step": 26569 }, { "epoch": 0.73, "learning_rate": 3.695506612929254e-06, "loss": 1.3254, "step": 26570 }, { "epoch": 0.73, "learning_rate": 3.69482005621988e-06, "loss": 1.2583, "step": 26571 }, { "epoch": 0.73, "learning_rate": 3.6941335488392636e-06, "loss": 1.3269, "step": 26572 }, { "epoch": 0.73, "learning_rate": 3.6934470907927864e-06, "loss": 1.2661, "step": 26573 }, { "epoch": 0.73, "learning_rate": 3.6927606820858133e-06, "loss": 1.3289, "step": 26574 }, { "epoch": 0.73, "learning_rate": 3.6920743227237134e-06, "loss": 1.3206, "step": 26575 }, { "epoch": 0.73, "learning_rate": 3.691388012711855e-06, "loss": 1.4548, "step": 26576 }, { "epoch": 0.73, "learning_rate": 3.690701752055614e-06, "loss": 1.2329, "step": 26577 }, { "epoch": 0.73, "learning_rate": 3.6900155407603568e-06, "loss": 0.9832, "step": 26578 }, { "epoch": 0.73, "learning_rate": 3.689329378831449e-06, "loss": 1.3589, "step": 26579 }, { "epoch": 0.73, "learning_rate": 3.6886432662742576e-06, "loss": 1.3032, "step": 26580 }, { "epoch": 0.73, "learning_rate": 3.687957203094158e-06, "loss": 1.1658, "step": 26581 }, { "epoch": 0.73, "learning_rate": 3.6872711892965118e-06, "loss": 1.2795, "step": 26582 }, { "epoch": 0.73, "learning_rate": 3.686585224886684e-06, "loss": 1.1814, "step": 26583 }, { "epoch": 0.73, "learning_rate": 3.685899309870049e-06, "loss": 1.1941, "step": 26584 }, { "epoch": 0.73, "learning_rate": 3.6852134442519647e-06, "loss": 1.3196, "step": 26585 }, { "epoch": 0.73, "learning_rate": 3.6845276280378085e-06, "loss": 1.2688, "step": 26586 }, { "epoch": 0.73, "learning_rate": 3.6838418612329306e-06, "loss": 1.1613, "step": 26587 }, { "epoch": 0.73, "learning_rate": 3.6831561438427076e-06, "loss": 1.3599, "step": 26588 }, { "epoch": 0.73, "learning_rate": 3.6824704758724973e-06, "loss": 1.3003, "step": 26589 }, { "epoch": 0.73, "learning_rate": 3.681784857327674e-06, "loss": 1.2539, "step": 26590 }, { "epoch": 0.73, "learning_rate": 3.6810992882135876e-06, "loss": 1.3335, "step": 26591 }, { "epoch": 0.73, "learning_rate": 3.6804137685356136e-06, "loss": 1.1963, "step": 26592 }, { "epoch": 0.73, "learning_rate": 3.679728298299107e-06, "loss": 1.3857, "step": 26593 }, { "epoch": 0.73, "learning_rate": 3.67904287750944e-06, "loss": 1.3689, "step": 26594 }, { "epoch": 0.73, "learning_rate": 3.6783575061719634e-06, "loss": 1.1851, "step": 26595 }, { "epoch": 0.73, "learning_rate": 3.6776721842920483e-06, "loss": 1.3833, "step": 26596 }, { "epoch": 0.73, "learning_rate": 3.676986911875049e-06, "loss": 1.0503, "step": 26597 }, { "epoch": 0.73, "learning_rate": 3.6763016889263348e-06, "loss": 1.229, "step": 26598 }, { "epoch": 0.73, "learning_rate": 3.6756165154512613e-06, "loss": 1.4463, "step": 26599 }, { "epoch": 0.73, "learning_rate": 3.6749313914551885e-06, "loss": 1.1216, "step": 26600 }, { "epoch": 0.73, "learning_rate": 3.6742463169434806e-06, "loss": 1.2395, "step": 26601 }, { "epoch": 0.73, "learning_rate": 3.6735612919214958e-06, "loss": 1.385, "step": 26602 }, { "epoch": 0.73, "learning_rate": 3.6728763163945925e-06, "loss": 1.0547, "step": 26603 }, { "epoch": 0.73, "learning_rate": 3.672191390368125e-06, "loss": 1.1799, "step": 26604 }, { "epoch": 0.73, "learning_rate": 3.6715065138474617e-06, "loss": 1.3994, "step": 26605 }, { "epoch": 0.73, "learning_rate": 3.670821686837954e-06, "loss": 1.2651, "step": 26606 }, { "epoch": 0.73, "learning_rate": 3.6701369093449624e-06, "loss": 1.2819, "step": 26607 }, { "epoch": 0.73, "learning_rate": 3.669452181373839e-06, "loss": 1.2966, "step": 26608 }, { "epoch": 0.73, "learning_rate": 3.6687675029299486e-06, "loss": 1.2886, "step": 26609 }, { "epoch": 0.73, "learning_rate": 3.6680828740186436e-06, "loss": 1.283, "step": 26610 }, { "epoch": 0.73, "learning_rate": 3.6673982946452813e-06, "loss": 0.9856, "step": 26611 }, { "epoch": 0.73, "learning_rate": 3.666713764815214e-06, "loss": 1.301, "step": 26612 }, { "epoch": 0.73, "learning_rate": 3.666029284533802e-06, "loss": 1.3154, "step": 26613 }, { "epoch": 0.73, "learning_rate": 3.6653448538063998e-06, "loss": 1.3665, "step": 26614 }, { "epoch": 0.73, "learning_rate": 3.664660472638357e-06, "loss": 1.3591, "step": 26615 }, { "epoch": 0.73, "learning_rate": 3.663976141035035e-06, "loss": 1.3059, "step": 26616 }, { "epoch": 0.73, "learning_rate": 3.6632918590017842e-06, "loss": 1.6807, "step": 26617 }, { "epoch": 0.73, "learning_rate": 3.662607626543957e-06, "loss": 1.2703, "step": 26618 }, { "epoch": 0.73, "learning_rate": 3.661923443666906e-06, "loss": 1.3855, "step": 26619 }, { "epoch": 0.73, "learning_rate": 3.661239310375988e-06, "loss": 1.1006, "step": 26620 }, { "epoch": 0.73, "learning_rate": 3.6605552266765533e-06, "loss": 1.2307, "step": 26621 }, { "epoch": 0.73, "learning_rate": 3.6598711925739538e-06, "loss": 1.2949, "step": 26622 }, { "epoch": 0.73, "learning_rate": 3.659187208073537e-06, "loss": 1.1643, "step": 26623 }, { "epoch": 0.73, "learning_rate": 3.6585032731806604e-06, "loss": 1.356, "step": 26624 }, { "epoch": 0.73, "learning_rate": 3.657819387900673e-06, "loss": 1.2407, "step": 26625 }, { "epoch": 0.73, "learning_rate": 3.657135552238925e-06, "loss": 1.2424, "step": 26626 }, { "epoch": 0.73, "learning_rate": 3.6564517662007614e-06, "loss": 1.1011, "step": 26627 }, { "epoch": 0.73, "learning_rate": 3.6557680297915398e-06, "loss": 1.3533, "step": 26628 }, { "epoch": 0.73, "learning_rate": 3.655084343016606e-06, "loss": 1.2314, "step": 26629 }, { "epoch": 0.73, "learning_rate": 3.6544007058813056e-06, "loss": 1.2549, "step": 26630 }, { "epoch": 0.73, "learning_rate": 3.6537171183909937e-06, "loss": 1.3113, "step": 26631 }, { "epoch": 0.73, "learning_rate": 3.653033580551011e-06, "loss": 1.3352, "step": 26632 }, { "epoch": 0.73, "learning_rate": 3.6523500923667167e-06, "loss": 1.2471, "step": 26633 }, { "epoch": 0.73, "learning_rate": 3.651666653843442e-06, "loss": 1.2981, "step": 26634 }, { "epoch": 0.73, "learning_rate": 3.6509832649865475e-06, "loss": 1.218, "step": 26635 }, { "epoch": 0.73, "learning_rate": 3.6502999258013695e-06, "loss": 1.2441, "step": 26636 }, { "epoch": 0.73, "learning_rate": 3.649616636293266e-06, "loss": 1.3071, "step": 26637 }, { "epoch": 0.73, "learning_rate": 3.6489333964675697e-06, "loss": 1.3481, "step": 26638 }, { "epoch": 0.73, "learning_rate": 3.648250206329634e-06, "loss": 1.3257, "step": 26639 }, { "epoch": 0.73, "learning_rate": 3.6475670658848008e-06, "loss": 1.3325, "step": 26640 }, { "epoch": 0.73, "learning_rate": 3.646883975138421e-06, "loss": 1.3479, "step": 26641 }, { "epoch": 0.73, "learning_rate": 3.646200934095827e-06, "loss": 1.3667, "step": 26642 }, { "epoch": 0.73, "learning_rate": 3.645517942762372e-06, "loss": 1.3369, "step": 26643 }, { "epoch": 0.73, "learning_rate": 3.6448350011433943e-06, "loss": 1.2271, "step": 26644 }, { "epoch": 0.73, "learning_rate": 3.644152109244241e-06, "loss": 1.6099, "step": 26645 }, { "epoch": 0.73, "learning_rate": 3.643469267070254e-06, "loss": 1.1322, "step": 26646 }, { "epoch": 0.73, "learning_rate": 3.6427864746267717e-06, "loss": 1.2808, "step": 26647 }, { "epoch": 0.73, "learning_rate": 3.642103731919141e-06, "loss": 1.3313, "step": 26648 }, { "epoch": 0.73, "learning_rate": 3.6414210389527006e-06, "loss": 1.3706, "step": 26649 }, { "epoch": 0.73, "learning_rate": 3.6407383957327925e-06, "loss": 1.343, "step": 26650 }, { "epoch": 0.73, "learning_rate": 3.6400558022647538e-06, "loss": 1.4351, "step": 26651 }, { "epoch": 0.73, "learning_rate": 3.6393732585539308e-06, "loss": 1.1725, "step": 26652 }, { "epoch": 0.73, "learning_rate": 3.6386907646056603e-06, "loss": 1.2864, "step": 26653 }, { "epoch": 0.73, "learning_rate": 3.6380083204252824e-06, "loss": 1.2112, "step": 26654 }, { "epoch": 0.73, "learning_rate": 3.6373259260181317e-06, "loss": 1.2808, "step": 26655 }, { "epoch": 0.73, "learning_rate": 3.636643581389555e-06, "loss": 1.2275, "step": 26656 }, { "epoch": 0.73, "learning_rate": 3.635961286544887e-06, "loss": 1.1887, "step": 26657 }, { "epoch": 0.73, "learning_rate": 3.6352790414894646e-06, "loss": 1.2734, "step": 26658 }, { "epoch": 0.73, "learning_rate": 3.6345968462286228e-06, "loss": 1.3237, "step": 26659 }, { "epoch": 0.73, "learning_rate": 3.6339147007677058e-06, "loss": 1.2285, "step": 26660 }, { "epoch": 0.73, "learning_rate": 3.633232605112047e-06, "loss": 1.3906, "step": 26661 }, { "epoch": 0.73, "learning_rate": 3.6325505592669785e-06, "loss": 1.2908, "step": 26662 }, { "epoch": 0.73, "learning_rate": 3.6318685632378438e-06, "loss": 1.228, "step": 26663 }, { "epoch": 0.73, "learning_rate": 3.6311866170299736e-06, "loss": 1.2905, "step": 26664 }, { "epoch": 0.73, "learning_rate": 3.6305047206487065e-06, "loss": 1.3, "step": 26665 }, { "epoch": 0.73, "learning_rate": 3.6298228740993702e-06, "loss": 1.1519, "step": 26666 }, { "epoch": 0.73, "learning_rate": 3.629141077387309e-06, "loss": 1.2678, "step": 26667 }, { "epoch": 0.73, "learning_rate": 3.6284593305178515e-06, "loss": 1.2285, "step": 26668 }, { "epoch": 0.73, "learning_rate": 3.627777633496332e-06, "loss": 1.731, "step": 26669 }, { "epoch": 0.73, "learning_rate": 3.6270959863280817e-06, "loss": 1.167, "step": 26670 }, { "epoch": 0.73, "learning_rate": 3.626414389018438e-06, "loss": 1.3938, "step": 26671 }, { "epoch": 0.73, "learning_rate": 3.625732841572731e-06, "loss": 1.4211, "step": 26672 }, { "epoch": 0.73, "learning_rate": 3.6250513439962933e-06, "loss": 1.1655, "step": 26673 }, { "epoch": 0.73, "learning_rate": 3.624369896294453e-06, "loss": 1.2029, "step": 26674 }, { "epoch": 0.73, "learning_rate": 3.6236884984725475e-06, "loss": 1.3403, "step": 26675 }, { "epoch": 0.73, "learning_rate": 3.6230071505359044e-06, "loss": 1.136, "step": 26676 }, { "epoch": 0.73, "learning_rate": 3.622325852489852e-06, "loss": 1.3516, "step": 26677 }, { "epoch": 0.73, "learning_rate": 3.6216446043397256e-06, "loss": 1.2156, "step": 26678 }, { "epoch": 0.73, "learning_rate": 3.6209634060908504e-06, "loss": 1.4062, "step": 26679 }, { "epoch": 0.73, "learning_rate": 3.6202822577485643e-06, "loss": 1.2285, "step": 26680 }, { "epoch": 0.73, "learning_rate": 3.6196011593181825e-06, "loss": 1.2458, "step": 26681 }, { "epoch": 0.73, "learning_rate": 3.6189201108050443e-06, "loss": 1.2585, "step": 26682 }, { "epoch": 0.73, "learning_rate": 3.618239112214472e-06, "loss": 1.1611, "step": 26683 }, { "epoch": 0.73, "learning_rate": 3.617558163551802e-06, "loss": 1.6646, "step": 26684 }, { "epoch": 0.73, "learning_rate": 3.6168772648223493e-06, "loss": 1.2463, "step": 26685 }, { "epoch": 0.73, "learning_rate": 3.616196416031451e-06, "loss": 1.2942, "step": 26686 }, { "epoch": 0.73, "learning_rate": 3.6155156171844263e-06, "loss": 1.1519, "step": 26687 }, { "epoch": 0.73, "learning_rate": 3.6148348682866118e-06, "loss": 1.2161, "step": 26688 }, { "epoch": 0.73, "learning_rate": 3.6141541693433204e-06, "loss": 1.3992, "step": 26689 }, { "epoch": 0.73, "learning_rate": 3.613473520359887e-06, "loss": 1.3079, "step": 26690 }, { "epoch": 0.73, "learning_rate": 3.61279292134163e-06, "loss": 1.2634, "step": 26691 }, { "epoch": 0.73, "learning_rate": 3.6121123722938824e-06, "loss": 1.3506, "step": 26692 }, { "epoch": 0.73, "learning_rate": 3.611431873221962e-06, "loss": 1.3579, "step": 26693 }, { "epoch": 0.73, "learning_rate": 3.6107514241311925e-06, "loss": 1.2832, "step": 26694 }, { "epoch": 0.73, "learning_rate": 3.6100710250269024e-06, "loss": 1.2219, "step": 26695 }, { "epoch": 0.73, "learning_rate": 3.6093906759144113e-06, "loss": 1.2439, "step": 26696 }, { "epoch": 0.73, "learning_rate": 3.608710376799043e-06, "loss": 1.3462, "step": 26697 }, { "epoch": 0.73, "learning_rate": 3.6080301276861163e-06, "loss": 1.3315, "step": 26698 }, { "epoch": 0.73, "learning_rate": 3.6073499285809587e-06, "loss": 1.3489, "step": 26699 }, { "epoch": 0.73, "learning_rate": 3.6066697794888895e-06, "loss": 1.3445, "step": 26700 }, { "epoch": 0.73, "learning_rate": 3.6059896804152296e-06, "loss": 1.2844, "step": 26701 }, { "epoch": 0.73, "learning_rate": 3.605309631365297e-06, "loss": 1.3535, "step": 26702 }, { "epoch": 0.73, "learning_rate": 3.6046296323444172e-06, "loss": 1.1316, "step": 26703 }, { "epoch": 0.73, "learning_rate": 3.603949683357909e-06, "loss": 1.2375, "step": 26704 }, { "epoch": 0.73, "learning_rate": 3.6032697844110896e-06, "loss": 1.2673, "step": 26705 }, { "epoch": 0.73, "learning_rate": 3.6025899355092773e-06, "loss": 1.3171, "step": 26706 }, { "epoch": 0.73, "learning_rate": 3.6019101366577957e-06, "loss": 1.3501, "step": 26707 }, { "epoch": 0.73, "learning_rate": 3.6012303878619604e-06, "loss": 1.2261, "step": 26708 }, { "epoch": 0.73, "learning_rate": 3.6005506891270868e-06, "loss": 1.2971, "step": 26709 }, { "epoch": 0.73, "learning_rate": 3.599871040458498e-06, "loss": 1.4126, "step": 26710 }, { "epoch": 0.73, "learning_rate": 3.599191441861509e-06, "loss": 1.3044, "step": 26711 }, { "epoch": 0.73, "learning_rate": 3.5985118933414375e-06, "loss": 1.147, "step": 26712 }, { "epoch": 0.73, "learning_rate": 3.597832394903594e-06, "loss": 1.0637, "step": 26713 }, { "epoch": 0.73, "learning_rate": 3.597152946553303e-06, "loss": 1.2166, "step": 26714 }, { "epoch": 0.73, "learning_rate": 3.5964735482958766e-06, "loss": 1.4341, "step": 26715 }, { "epoch": 0.73, "learning_rate": 3.59579420013663e-06, "loss": 1.3555, "step": 26716 }, { "epoch": 0.73, "learning_rate": 3.5951149020808753e-06, "loss": 1.2881, "step": 26717 }, { "epoch": 0.73, "learning_rate": 3.5944356541339322e-06, "loss": 1.1462, "step": 26718 }, { "epoch": 0.73, "learning_rate": 3.593756456301113e-06, "loss": 1.3171, "step": 26719 }, { "epoch": 0.73, "learning_rate": 3.59307730858773e-06, "loss": 1.2905, "step": 26720 }, { "epoch": 0.73, "learning_rate": 3.592398210999095e-06, "loss": 1.3147, "step": 26721 }, { "epoch": 0.73, "learning_rate": 3.5917191635405222e-06, "loss": 1.24, "step": 26722 }, { "epoch": 0.73, "learning_rate": 3.5910401662173332e-06, "loss": 1.2642, "step": 26723 }, { "epoch": 0.73, "learning_rate": 3.5903612190348258e-06, "loss": 0.9481, "step": 26724 }, { "epoch": 0.73, "learning_rate": 3.58968232199832e-06, "loss": 1.229, "step": 26725 }, { "epoch": 0.73, "learning_rate": 3.5890034751131232e-06, "loss": 1.3123, "step": 26726 }, { "epoch": 0.73, "learning_rate": 3.588324678384555e-06, "loss": 1.1758, "step": 26727 }, { "epoch": 0.73, "learning_rate": 3.5876459318179137e-06, "loss": 1.1643, "step": 26728 }, { "epoch": 0.73, "learning_rate": 3.586967235418517e-06, "loss": 1.2173, "step": 26729 }, { "epoch": 0.73, "learning_rate": 3.586288589191671e-06, "loss": 1.3201, "step": 26730 }, { "epoch": 0.73, "learning_rate": 3.5856099931426935e-06, "loss": 1.2168, "step": 26731 }, { "epoch": 0.73, "learning_rate": 3.5849314472768803e-06, "loss": 1.3447, "step": 26732 }, { "epoch": 0.73, "learning_rate": 3.5842529515995497e-06, "loss": 1.3308, "step": 26733 }, { "epoch": 0.73, "learning_rate": 3.5835745061160045e-06, "loss": 1.249, "step": 26734 }, { "epoch": 0.73, "learning_rate": 3.582896110831562e-06, "loss": 1.459, "step": 26735 }, { "epoch": 0.73, "learning_rate": 3.5822177657515157e-06, "loss": 1.2864, "step": 26736 }, { "epoch": 0.73, "learning_rate": 3.5815394708811825e-06, "loss": 1.2214, "step": 26737 }, { "epoch": 0.73, "learning_rate": 3.5808612262258635e-06, "loss": 1.0791, "step": 26738 }, { "epoch": 0.73, "learning_rate": 3.5801830317908713e-06, "loss": 1.1406, "step": 26739 }, { "epoch": 0.73, "learning_rate": 3.5795048875815087e-06, "loss": 1.2837, "step": 26740 }, { "epoch": 0.73, "learning_rate": 3.5788267936030765e-06, "loss": 1.1887, "step": 26741 }, { "epoch": 0.73, "learning_rate": 3.578148749860887e-06, "loss": 1.4155, "step": 26742 }, { "epoch": 0.73, "learning_rate": 3.577470756360243e-06, "loss": 1.1946, "step": 26743 }, { "epoch": 0.73, "learning_rate": 3.5767928131064478e-06, "loss": 1.3025, "step": 26744 }, { "epoch": 0.73, "learning_rate": 3.5761149201048007e-06, "loss": 1.3215, "step": 26745 }, { "epoch": 0.73, "learning_rate": 3.575437077360614e-06, "loss": 1.3242, "step": 26746 }, { "epoch": 0.73, "learning_rate": 3.574759284879187e-06, "loss": 1.2971, "step": 26747 }, { "epoch": 0.73, "learning_rate": 3.5740815426658204e-06, "loss": 1.2927, "step": 26748 }, { "epoch": 0.73, "learning_rate": 3.5734038507258163e-06, "loss": 0.9875, "step": 26749 }, { "epoch": 0.73, "learning_rate": 3.572726209064481e-06, "loss": 1.6895, "step": 26750 }, { "epoch": 0.73, "learning_rate": 3.572048617687114e-06, "loss": 1.2881, "step": 26751 }, { "epoch": 0.73, "learning_rate": 3.571371076599015e-06, "loss": 1.3032, "step": 26752 }, { "epoch": 0.73, "learning_rate": 3.5706935858054837e-06, "loss": 1.1992, "step": 26753 }, { "epoch": 0.73, "learning_rate": 3.5700161453118256e-06, "loss": 1.3904, "step": 26754 }, { "epoch": 0.73, "learning_rate": 3.5693387551233373e-06, "loss": 1.1882, "step": 26755 }, { "epoch": 0.73, "learning_rate": 3.568661415245315e-06, "loss": 1.7305, "step": 26756 }, { "epoch": 0.73, "learning_rate": 3.567984125683065e-06, "loss": 1.2458, "step": 26757 }, { "epoch": 0.73, "learning_rate": 3.5673068864418826e-06, "loss": 1.3533, "step": 26758 }, { "epoch": 0.73, "learning_rate": 3.5666296975270666e-06, "loss": 1.4065, "step": 26759 }, { "epoch": 0.73, "learning_rate": 3.5659525589439114e-06, "loss": 1.5884, "step": 26760 }, { "epoch": 0.73, "learning_rate": 3.565275470697721e-06, "loss": 1.2173, "step": 26761 }, { "epoch": 0.73, "learning_rate": 3.56459843279379e-06, "loss": 1.7275, "step": 26762 }, { "epoch": 0.73, "learning_rate": 3.5639214452374137e-06, "loss": 1.3154, "step": 26763 }, { "epoch": 0.73, "learning_rate": 3.5632445080338874e-06, "loss": 1.1963, "step": 26764 }, { "epoch": 0.73, "learning_rate": 3.562567621188512e-06, "loss": 1.291, "step": 26765 }, { "epoch": 0.73, "learning_rate": 3.56189078470658e-06, "loss": 1.22, "step": 26766 }, { "epoch": 0.73, "learning_rate": 3.561213998593388e-06, "loss": 1.2278, "step": 26767 }, { "epoch": 0.73, "learning_rate": 3.5605372628542254e-06, "loss": 1.1946, "step": 26768 }, { "epoch": 0.73, "learning_rate": 3.559860577494393e-06, "loss": 1.2688, "step": 26769 }, { "epoch": 0.73, "learning_rate": 3.5591839425191886e-06, "loss": 1.45, "step": 26770 }, { "epoch": 0.73, "learning_rate": 3.5585073579338934e-06, "loss": 1.27, "step": 26771 }, { "epoch": 0.73, "learning_rate": 3.5578308237438107e-06, "loss": 1.3142, "step": 26772 }, { "epoch": 0.73, "learning_rate": 3.5571543399542284e-06, "loss": 1.1682, "step": 26773 }, { "epoch": 0.73, "learning_rate": 3.556477906570447e-06, "loss": 1.2766, "step": 26774 }, { "epoch": 0.73, "learning_rate": 3.555801523597745e-06, "loss": 1.3567, "step": 26775 }, { "epoch": 0.73, "learning_rate": 3.5551251910414263e-06, "loss": 1.2, "step": 26776 }, { "epoch": 0.73, "learning_rate": 3.5544489089067735e-06, "loss": 1.718, "step": 26777 }, { "epoch": 0.73, "learning_rate": 3.5537726771990875e-06, "loss": 1.2549, "step": 26778 }, { "epoch": 0.73, "learning_rate": 3.553096495923647e-06, "loss": 1.2109, "step": 26779 }, { "epoch": 0.73, "learning_rate": 3.5524203650857512e-06, "loss": 1.2114, "step": 26780 }, { "epoch": 0.73, "learning_rate": 3.5517442846906837e-06, "loss": 1.4082, "step": 26781 }, { "epoch": 0.73, "learning_rate": 3.551068254743739e-06, "loss": 1.4395, "step": 26782 }, { "epoch": 0.73, "learning_rate": 3.550392275250204e-06, "loss": 1.324, "step": 26783 }, { "epoch": 0.73, "learning_rate": 3.5497163462153648e-06, "loss": 1.5098, "step": 26784 }, { "epoch": 0.73, "learning_rate": 3.5490404676445143e-06, "loss": 1.4131, "step": 26785 }, { "epoch": 0.73, "learning_rate": 3.548364639542937e-06, "loss": 1.3135, "step": 26786 }, { "epoch": 0.73, "learning_rate": 3.5476888619159222e-06, "loss": 1.1423, "step": 26787 }, { "epoch": 0.73, "learning_rate": 3.547013134768752e-06, "loss": 1.3108, "step": 26788 }, { "epoch": 0.73, "learning_rate": 3.54633745810672e-06, "loss": 1.0786, "step": 26789 }, { "epoch": 0.73, "learning_rate": 3.5456618319351086e-06, "loss": 1.2285, "step": 26790 }, { "epoch": 0.73, "learning_rate": 3.544986256259204e-06, "loss": 1.1597, "step": 26791 }, { "epoch": 0.73, "learning_rate": 3.5443107310842884e-06, "loss": 1.3037, "step": 26792 }, { "epoch": 0.73, "learning_rate": 3.543635256415654e-06, "loss": 1.1321, "step": 26793 }, { "epoch": 0.73, "learning_rate": 3.5429598322585803e-06, "loss": 1.3059, "step": 26794 }, { "epoch": 0.73, "learning_rate": 3.5422844586183536e-06, "loss": 1.3162, "step": 26795 }, { "epoch": 0.73, "learning_rate": 3.5416091355002525e-06, "loss": 1.2666, "step": 26796 }, { "epoch": 0.73, "learning_rate": 3.5409338629095678e-06, "loss": 1.1826, "step": 26797 }, { "epoch": 0.73, "learning_rate": 3.5402586408515795e-06, "loss": 1.1719, "step": 26798 }, { "epoch": 0.73, "learning_rate": 3.5395834693315702e-06, "loss": 1.2942, "step": 26799 }, { "epoch": 0.73, "learning_rate": 3.538908348354818e-06, "loss": 1.1538, "step": 26800 }, { "epoch": 0.73, "learning_rate": 3.5382332779266127e-06, "loss": 1.1897, "step": 26801 }, { "epoch": 0.73, "learning_rate": 3.5375582580522317e-06, "loss": 1.2593, "step": 26802 }, { "epoch": 0.73, "learning_rate": 3.536883288736953e-06, "loss": 1.3318, "step": 26803 }, { "epoch": 0.73, "learning_rate": 3.5362083699860627e-06, "loss": 1.2568, "step": 26804 }, { "epoch": 0.73, "learning_rate": 3.5355335018048386e-06, "loss": 1.1836, "step": 26805 }, { "epoch": 0.73, "learning_rate": 3.534858684198561e-06, "loss": 1.218, "step": 26806 }, { "epoch": 0.73, "learning_rate": 3.5341839171725054e-06, "loss": 1.3005, "step": 26807 }, { "epoch": 0.73, "learning_rate": 3.533509200731958e-06, "loss": 1.2275, "step": 26808 }, { "epoch": 0.73, "learning_rate": 3.5328345348821945e-06, "loss": 1.2812, "step": 26809 }, { "epoch": 0.73, "learning_rate": 3.532159919628492e-06, "loss": 1.1332, "step": 26810 }, { "epoch": 0.73, "learning_rate": 3.531485354976125e-06, "loss": 1.343, "step": 26811 }, { "epoch": 0.73, "learning_rate": 3.5308108409303785e-06, "loss": 1.3293, "step": 26812 }, { "epoch": 0.73, "learning_rate": 3.5301363774965256e-06, "loss": 1.1958, "step": 26813 }, { "epoch": 0.73, "learning_rate": 3.5294619646798447e-06, "loss": 1.1062, "step": 26814 }, { "epoch": 0.73, "learning_rate": 3.5287876024856062e-06, "loss": 1.2285, "step": 26815 }, { "epoch": 0.73, "learning_rate": 3.5281132909190908e-06, "loss": 1.1826, "step": 26816 }, { "epoch": 0.73, "learning_rate": 3.5274390299855765e-06, "loss": 1.2786, "step": 26817 }, { "epoch": 0.73, "learning_rate": 3.526764819690337e-06, "loss": 1.2849, "step": 26818 }, { "epoch": 0.73, "learning_rate": 3.5260906600386446e-06, "loss": 1.0598, "step": 26819 }, { "epoch": 0.73, "learning_rate": 3.525416551035771e-06, "loss": 1.354, "step": 26820 }, { "epoch": 0.73, "learning_rate": 3.524742492686998e-06, "loss": 1.2949, "step": 26821 }, { "epoch": 0.73, "learning_rate": 3.5240684849975946e-06, "loss": 1.2305, "step": 26822 }, { "epoch": 0.73, "learning_rate": 3.523394527972833e-06, "loss": 1.3657, "step": 26823 }, { "epoch": 0.73, "learning_rate": 3.5227206216179854e-06, "loss": 1.396, "step": 26824 }, { "epoch": 0.73, "learning_rate": 3.5220467659383283e-06, "loss": 1.3694, "step": 26825 }, { "epoch": 0.73, "learning_rate": 3.5213729609391313e-06, "loss": 1.2695, "step": 26826 }, { "epoch": 0.73, "learning_rate": 3.5206992066256663e-06, "loss": 1.3728, "step": 26827 }, { "epoch": 0.73, "learning_rate": 3.5200255030032006e-06, "loss": 1.3286, "step": 26828 }, { "epoch": 0.73, "learning_rate": 3.5193518500770107e-06, "loss": 1.0354, "step": 26829 }, { "epoch": 0.73, "learning_rate": 3.5186782478523653e-06, "loss": 1.4033, "step": 26830 }, { "epoch": 0.73, "learning_rate": 3.5180046963345294e-06, "loss": 1.252, "step": 26831 }, { "epoch": 0.73, "learning_rate": 3.51733119552878e-06, "loss": 1.2468, "step": 26832 }, { "epoch": 0.73, "learning_rate": 3.516657745440384e-06, "loss": 1.1455, "step": 26833 }, { "epoch": 0.73, "learning_rate": 3.515984346074609e-06, "loss": 1.2241, "step": 26834 }, { "epoch": 0.73, "learning_rate": 3.5153109974367196e-06, "loss": 1.1904, "step": 26835 }, { "epoch": 0.73, "learning_rate": 3.5146376995319907e-06, "loss": 1.2683, "step": 26836 }, { "epoch": 0.73, "learning_rate": 3.513964452365688e-06, "loss": 1.3035, "step": 26837 }, { "epoch": 0.73, "learning_rate": 3.5132912559430764e-06, "loss": 1.1687, "step": 26838 }, { "epoch": 0.73, "learning_rate": 3.5126181102694203e-06, "loss": 1.1907, "step": 26839 }, { "epoch": 0.73, "learning_rate": 3.5119450153499933e-06, "loss": 1.394, "step": 26840 }, { "epoch": 0.73, "learning_rate": 3.511271971190058e-06, "loss": 1.3018, "step": 26841 }, { "epoch": 0.73, "learning_rate": 3.510598977794879e-06, "loss": 1.3123, "step": 26842 }, { "epoch": 0.73, "learning_rate": 3.5099260351697185e-06, "loss": 1.0969, "step": 26843 }, { "epoch": 0.73, "learning_rate": 3.5092531433198485e-06, "loss": 1.3235, "step": 26844 }, { "epoch": 0.73, "learning_rate": 3.5085803022505304e-06, "loss": 1.1848, "step": 26845 }, { "epoch": 0.73, "learning_rate": 3.5079075119670238e-06, "loss": 1.3738, "step": 26846 }, { "epoch": 0.73, "learning_rate": 3.5072347724745993e-06, "loss": 1.2744, "step": 26847 }, { "epoch": 0.73, "learning_rate": 3.506562083778513e-06, "loss": 1.3062, "step": 26848 }, { "epoch": 0.73, "learning_rate": 3.505889445884039e-06, "loss": 1.1973, "step": 26849 }, { "epoch": 0.73, "learning_rate": 3.5052168587964243e-06, "loss": 1.3643, "step": 26850 }, { "epoch": 0.73, "learning_rate": 3.504544322520943e-06, "loss": 1.2959, "step": 26851 }, { "epoch": 0.73, "learning_rate": 3.50387183706285e-06, "loss": 1.4194, "step": 26852 }, { "epoch": 0.73, "learning_rate": 3.503199402427414e-06, "loss": 1.3018, "step": 26853 }, { "epoch": 0.73, "learning_rate": 3.5025270186198857e-06, "loss": 1.2886, "step": 26854 }, { "epoch": 0.73, "learning_rate": 3.5018546856455337e-06, "loss": 1.3674, "step": 26855 }, { "epoch": 0.73, "learning_rate": 3.501182403509611e-06, "loss": 1.3887, "step": 26856 }, { "epoch": 0.73, "learning_rate": 3.5005101722173883e-06, "loss": 1.2891, "step": 26857 }, { "epoch": 0.73, "learning_rate": 3.499837991774111e-06, "loss": 1.2056, "step": 26858 }, { "epoch": 0.73, "learning_rate": 3.499165862185048e-06, "loss": 1.2756, "step": 26859 }, { "epoch": 0.73, "learning_rate": 3.498493783455451e-06, "loss": 1.3418, "step": 26860 }, { "epoch": 0.73, "learning_rate": 3.497821755590588e-06, "loss": 1.2563, "step": 26861 }, { "epoch": 0.73, "learning_rate": 3.497149778595704e-06, "loss": 1.176, "step": 26862 }, { "epoch": 0.73, "learning_rate": 3.496477852476062e-06, "loss": 1.2153, "step": 26863 }, { "epoch": 0.73, "learning_rate": 3.4958059772369223e-06, "loss": 1.198, "step": 26864 }, { "epoch": 0.73, "learning_rate": 3.495134152883538e-06, "loss": 0.9937, "step": 26865 }, { "epoch": 0.73, "learning_rate": 3.4944623794211653e-06, "loss": 1.2927, "step": 26866 }, { "epoch": 0.73, "learning_rate": 3.493790656855057e-06, "loss": 1.3596, "step": 26867 }, { "epoch": 0.73, "learning_rate": 3.4931189851904734e-06, "loss": 1.2678, "step": 26868 }, { "epoch": 0.73, "learning_rate": 3.4924473644326683e-06, "loss": 1.2795, "step": 26869 }, { "epoch": 0.73, "learning_rate": 3.4917757945868946e-06, "loss": 1.3511, "step": 26870 }, { "epoch": 0.73, "learning_rate": 3.4911042756584036e-06, "loss": 1.3691, "step": 26871 }, { "epoch": 0.73, "learning_rate": 3.4904328076524553e-06, "loss": 1.2356, "step": 26872 }, { "epoch": 0.73, "learning_rate": 3.489761390574299e-06, "loss": 1.1953, "step": 26873 }, { "epoch": 0.73, "learning_rate": 3.489090024429188e-06, "loss": 1.2629, "step": 26874 }, { "epoch": 0.73, "learning_rate": 3.488418709222373e-06, "loss": 1.2861, "step": 26875 }, { "epoch": 0.73, "learning_rate": 3.487747444959111e-06, "loss": 1.2024, "step": 26876 }, { "epoch": 0.73, "learning_rate": 3.4870762316446504e-06, "loss": 1.3115, "step": 26877 }, { "epoch": 0.73, "learning_rate": 3.4864050692842387e-06, "loss": 1.2844, "step": 26878 }, { "epoch": 0.73, "learning_rate": 3.485733957883135e-06, "loss": 1.2559, "step": 26879 }, { "epoch": 0.73, "learning_rate": 3.485062897446586e-06, "loss": 1.2988, "step": 26880 }, { "epoch": 0.73, "learning_rate": 3.484391887979841e-06, "loss": 1.2993, "step": 26881 }, { "epoch": 0.73, "learning_rate": 3.483720929488147e-06, "loss": 1.2732, "step": 26882 }, { "epoch": 0.73, "learning_rate": 3.483050021976758e-06, "loss": 1.0977, "step": 26883 }, { "epoch": 0.73, "learning_rate": 3.482379165450923e-06, "loss": 1.1433, "step": 26884 }, { "epoch": 0.73, "learning_rate": 3.4817083599158874e-06, "loss": 1.2747, "step": 26885 }, { "epoch": 0.73, "learning_rate": 3.481037605376898e-06, "loss": 1.4009, "step": 26886 }, { "epoch": 0.73, "learning_rate": 3.4803669018392083e-06, "loss": 1.3547, "step": 26887 }, { "epoch": 0.73, "learning_rate": 3.4796962493080622e-06, "loss": 1.0171, "step": 26888 }, { "epoch": 0.73, "learning_rate": 3.4790256477887063e-06, "loss": 1.2834, "step": 26889 }, { "epoch": 0.73, "learning_rate": 3.478355097286383e-06, "loss": 1.2996, "step": 26890 }, { "epoch": 0.73, "learning_rate": 3.477684597806348e-06, "loss": 1.6401, "step": 26891 }, { "epoch": 0.73, "learning_rate": 3.4770141493538403e-06, "loss": 1.2773, "step": 26892 }, { "epoch": 0.73, "learning_rate": 3.4763437519341038e-06, "loss": 1.2246, "step": 26893 }, { "epoch": 0.73, "learning_rate": 3.4756734055523887e-06, "loss": 1.116, "step": 26894 }, { "epoch": 0.73, "learning_rate": 3.475003110213935e-06, "loss": 1.0237, "step": 26895 }, { "epoch": 0.73, "learning_rate": 3.474332865923994e-06, "loss": 1.342, "step": 26896 }, { "epoch": 0.73, "learning_rate": 3.473662672687799e-06, "loss": 1.3828, "step": 26897 }, { "epoch": 0.73, "learning_rate": 3.4729925305106006e-06, "loss": 1.2209, "step": 26898 }, { "epoch": 0.73, "learning_rate": 3.4723224393976353e-06, "loss": 1.3289, "step": 26899 }, { "epoch": 0.73, "learning_rate": 3.471652399354157e-06, "loss": 1.1335, "step": 26900 }, { "epoch": 0.73, "learning_rate": 3.470982410385395e-06, "loss": 1.373, "step": 26901 }, { "epoch": 0.73, "learning_rate": 3.4703124724965984e-06, "loss": 1.3613, "step": 26902 }, { "epoch": 0.73, "learning_rate": 3.469642585693004e-06, "loss": 1.3118, "step": 26903 }, { "epoch": 0.73, "learning_rate": 3.468972749979862e-06, "loss": 1.1619, "step": 26904 }, { "epoch": 0.73, "learning_rate": 3.4683029653623988e-06, "loss": 1.3594, "step": 26905 }, { "epoch": 0.73, "learning_rate": 3.467633231845865e-06, "loss": 1.3857, "step": 26906 }, { "epoch": 0.73, "learning_rate": 3.4669635494354938e-06, "loss": 1.3691, "step": 26907 }, { "epoch": 0.73, "learning_rate": 3.466293918136532e-06, "loss": 1.2761, "step": 26908 }, { "epoch": 0.73, "learning_rate": 3.465624337954213e-06, "loss": 1.3296, "step": 26909 }, { "epoch": 0.73, "learning_rate": 3.4649548088937733e-06, "loss": 1.3037, "step": 26910 }, { "epoch": 0.73, "learning_rate": 3.4642853309604587e-06, "loss": 1.1924, "step": 26911 }, { "epoch": 0.73, "learning_rate": 3.463615904159501e-06, "loss": 1.2686, "step": 26912 }, { "epoch": 0.73, "learning_rate": 3.4629465284961395e-06, "loss": 1.252, "step": 26913 }, { "epoch": 0.74, "learning_rate": 3.462277203975607e-06, "loss": 1.2422, "step": 26914 }, { "epoch": 0.74, "learning_rate": 3.461607930603147e-06, "loss": 1.344, "step": 26915 }, { "epoch": 0.74, "learning_rate": 3.460938708383992e-06, "loss": 1.6626, "step": 26916 }, { "epoch": 0.74, "learning_rate": 3.4602695373233773e-06, "loss": 1.1917, "step": 26917 }, { "epoch": 0.74, "learning_rate": 3.4596004174265353e-06, "loss": 1.1819, "step": 26918 }, { "epoch": 0.74, "learning_rate": 3.4589313486987076e-06, "loss": 1.3037, "step": 26919 }, { "epoch": 0.74, "learning_rate": 3.4582623311451245e-06, "loss": 1.4342, "step": 26920 }, { "epoch": 0.74, "learning_rate": 3.4575933647710213e-06, "loss": 1.1716, "step": 26921 }, { "epoch": 0.74, "learning_rate": 3.456924449581628e-06, "loss": 1.2178, "step": 26922 }, { "epoch": 0.74, "learning_rate": 3.4562555855821844e-06, "loss": 1.2842, "step": 26923 }, { "epoch": 0.74, "learning_rate": 3.45558677277792e-06, "loss": 1.269, "step": 26924 }, { "epoch": 0.74, "learning_rate": 3.454918011174063e-06, "loss": 1.2781, "step": 26925 }, { "epoch": 0.74, "learning_rate": 3.4542493007758547e-06, "loss": 1.2622, "step": 26926 }, { "epoch": 0.74, "learning_rate": 3.453580641588521e-06, "loss": 1.3298, "step": 26927 }, { "epoch": 0.74, "learning_rate": 3.452912033617294e-06, "loss": 1.1394, "step": 26928 }, { "epoch": 0.74, "learning_rate": 3.4522434768674006e-06, "loss": 1.178, "step": 26929 }, { "epoch": 0.74, "learning_rate": 3.4515749713440793e-06, "loss": 1.2881, "step": 26930 }, { "epoch": 0.74, "learning_rate": 3.450906517052557e-06, "loss": 1.2969, "step": 26931 }, { "epoch": 0.74, "learning_rate": 3.450238113998061e-06, "loss": 1.3091, "step": 26932 }, { "epoch": 0.74, "learning_rate": 3.4495697621858193e-06, "loss": 1.3232, "step": 26933 }, { "epoch": 0.74, "learning_rate": 3.448901461621067e-06, "loss": 1.1938, "step": 26934 }, { "epoch": 0.74, "learning_rate": 3.44823321230903e-06, "loss": 1.3931, "step": 26935 }, { "epoch": 0.74, "learning_rate": 3.4475650142549342e-06, "loss": 1.2048, "step": 26936 }, { "epoch": 0.74, "learning_rate": 3.4468968674640057e-06, "loss": 1.3677, "step": 26937 }, { "epoch": 0.74, "learning_rate": 3.4462287719414775e-06, "loss": 1.1873, "step": 26938 }, { "epoch": 0.74, "learning_rate": 3.445560727692574e-06, "loss": 1.269, "step": 26939 }, { "epoch": 0.74, "learning_rate": 3.444892734722518e-06, "loss": 1.1882, "step": 26940 }, { "epoch": 0.74, "learning_rate": 3.4442247930365423e-06, "loss": 1.7998, "step": 26941 }, { "epoch": 0.74, "learning_rate": 3.4435569026398653e-06, "loss": 1.3245, "step": 26942 }, { "epoch": 0.74, "learning_rate": 3.442889063537723e-06, "loss": 1.2073, "step": 26943 }, { "epoch": 0.74, "learning_rate": 3.4422212757353267e-06, "loss": 1.75, "step": 26944 }, { "epoch": 0.74, "learning_rate": 3.4415535392379107e-06, "loss": 1.2896, "step": 26945 }, { "epoch": 0.74, "learning_rate": 3.4408858540506916e-06, "loss": 0.9629, "step": 26946 }, { "epoch": 0.74, "learning_rate": 3.440218220178905e-06, "loss": 1.2332, "step": 26947 }, { "epoch": 0.74, "learning_rate": 3.43955063762776e-06, "loss": 1.2871, "step": 26948 }, { "epoch": 0.74, "learning_rate": 3.4388831064024886e-06, "loss": 1.3804, "step": 26949 }, { "epoch": 0.74, "learning_rate": 3.4382156265083067e-06, "loss": 1.2832, "step": 26950 }, { "epoch": 0.74, "learning_rate": 3.4375481979504476e-06, "loss": 1.3191, "step": 26951 }, { "epoch": 0.74, "learning_rate": 3.4368808207341188e-06, "loss": 1.7358, "step": 26952 }, { "epoch": 0.74, "learning_rate": 3.4362134948645507e-06, "loss": 1.3682, "step": 26953 }, { "epoch": 0.74, "learning_rate": 3.4355462203469603e-06, "loss": 1.1759, "step": 26954 }, { "epoch": 0.74, "learning_rate": 3.4348789971865716e-06, "loss": 1.2329, "step": 26955 }, { "epoch": 0.74, "learning_rate": 3.4342118253886027e-06, "loss": 1.325, "step": 26956 }, { "epoch": 0.74, "learning_rate": 3.4335447049582693e-06, "loss": 1.4119, "step": 26957 }, { "epoch": 0.74, "learning_rate": 3.4328776359007976e-06, "loss": 1.1606, "step": 26958 }, { "epoch": 0.74, "learning_rate": 3.432210618221403e-06, "loss": 1.2058, "step": 26959 }, { "epoch": 0.74, "learning_rate": 3.4315436519253053e-06, "loss": 1.1733, "step": 26960 }, { "epoch": 0.74, "learning_rate": 3.4308767370177164e-06, "loss": 1.0756, "step": 26961 }, { "epoch": 0.74, "learning_rate": 3.4302098735038634e-06, "loss": 1.3208, "step": 26962 }, { "epoch": 0.74, "learning_rate": 3.429543061388959e-06, "loss": 1.2432, "step": 26963 }, { "epoch": 0.74, "learning_rate": 3.42887630067822e-06, "loss": 1.2336, "step": 26964 }, { "epoch": 0.74, "learning_rate": 3.4282095913768587e-06, "loss": 1.2585, "step": 26965 }, { "epoch": 0.74, "learning_rate": 3.4275429334901e-06, "loss": 1.1736, "step": 26966 }, { "epoch": 0.74, "learning_rate": 3.426876327023154e-06, "loss": 1.1514, "step": 26967 }, { "epoch": 0.74, "learning_rate": 3.426209771981237e-06, "loss": 1.1825, "step": 26968 }, { "epoch": 0.74, "learning_rate": 3.42554326836956e-06, "loss": 1.3452, "step": 26969 }, { "epoch": 0.74, "learning_rate": 3.4248768161933444e-06, "loss": 1.2683, "step": 26970 }, { "epoch": 0.74, "learning_rate": 3.4242104154578005e-06, "loss": 1.3145, "step": 26971 }, { "epoch": 0.74, "learning_rate": 3.4235440661681385e-06, "loss": 1.3813, "step": 26972 }, { "epoch": 0.74, "learning_rate": 3.422877768329579e-06, "loss": 1.1089, "step": 26973 }, { "epoch": 0.74, "learning_rate": 3.4222115219473308e-06, "loss": 1.2233, "step": 26974 }, { "epoch": 0.74, "learning_rate": 3.4215453270266074e-06, "loss": 1.1943, "step": 26975 }, { "epoch": 0.74, "learning_rate": 3.4208791835726164e-06, "loss": 1.1226, "step": 26976 }, { "epoch": 0.74, "learning_rate": 3.420213091590575e-06, "loss": 1.3528, "step": 26977 }, { "epoch": 0.74, "learning_rate": 3.419547051085693e-06, "loss": 1.2761, "step": 26978 }, { "epoch": 0.74, "learning_rate": 3.418881062063182e-06, "loss": 1.2729, "step": 26979 }, { "epoch": 0.74, "learning_rate": 3.4182151245282457e-06, "loss": 1.1934, "step": 26980 }, { "epoch": 0.74, "learning_rate": 3.4175492384861033e-06, "loss": 1.2678, "step": 26981 }, { "epoch": 0.74, "learning_rate": 3.4168834039419607e-06, "loss": 1.2852, "step": 26982 }, { "epoch": 0.74, "learning_rate": 3.4162176209010266e-06, "loss": 1.1921, "step": 26983 }, { "epoch": 0.74, "learning_rate": 3.4155518893685057e-06, "loss": 1.3333, "step": 26984 }, { "epoch": 0.74, "learning_rate": 3.414886209349615e-06, "loss": 1.3416, "step": 26985 }, { "epoch": 0.74, "learning_rate": 3.4142205808495575e-06, "loss": 1.4077, "step": 26986 }, { "epoch": 0.74, "learning_rate": 3.413555003873539e-06, "loss": 1.2822, "step": 26987 }, { "epoch": 0.74, "learning_rate": 3.412889478426771e-06, "loss": 1.2126, "step": 26988 }, { "epoch": 0.74, "learning_rate": 3.412224004514455e-06, "loss": 1.1917, "step": 26989 }, { "epoch": 0.74, "learning_rate": 3.4115585821418085e-06, "loss": 1.4155, "step": 26990 }, { "epoch": 0.74, "learning_rate": 3.4108932113140212e-06, "loss": 1.2769, "step": 26991 }, { "epoch": 0.74, "learning_rate": 3.410227892036312e-06, "loss": 1.2644, "step": 26992 }, { "epoch": 0.74, "learning_rate": 3.409562624313877e-06, "loss": 1.1504, "step": 26993 }, { "epoch": 0.74, "learning_rate": 3.408897408151931e-06, "loss": 1.2214, "step": 26994 }, { "epoch": 0.74, "learning_rate": 3.4082322435556667e-06, "loss": 1.2781, "step": 26995 }, { "epoch": 0.74, "learning_rate": 3.407567130530296e-06, "loss": 1.3601, "step": 26996 }, { "epoch": 0.74, "learning_rate": 3.406902069081017e-06, "loss": 1.4641, "step": 26997 }, { "epoch": 0.74, "learning_rate": 3.4062370592130436e-06, "loss": 1.3438, "step": 26998 }, { "epoch": 0.74, "learning_rate": 3.4055721009315635e-06, "loss": 1.095, "step": 26999 }, { "epoch": 0.74, "learning_rate": 3.40490719424179e-06, "loss": 1.252, "step": 27000 }, { "epoch": 0.74, "learning_rate": 3.4042423391489176e-06, "loss": 1.1079, "step": 27001 }, { "epoch": 0.74, "learning_rate": 3.4035775356581546e-06, "loss": 1.1324, "step": 27002 }, { "epoch": 0.74, "learning_rate": 3.4029127837747e-06, "loss": 1.2207, "step": 27003 }, { "epoch": 0.74, "learning_rate": 3.40224808350375e-06, "loss": 1.2776, "step": 27004 }, { "epoch": 0.74, "learning_rate": 3.4015834348505105e-06, "loss": 1.2751, "step": 27005 }, { "epoch": 0.74, "learning_rate": 3.4009188378201807e-06, "loss": 1.3218, "step": 27006 }, { "epoch": 0.74, "learning_rate": 3.400254292417959e-06, "loss": 1.4019, "step": 27007 }, { "epoch": 0.74, "learning_rate": 3.399589798649041e-06, "loss": 1.4177, "step": 27008 }, { "epoch": 0.74, "learning_rate": 3.398925356518631e-06, "loss": 1.3237, "step": 27009 }, { "epoch": 0.74, "learning_rate": 3.3982609660319253e-06, "loss": 1.2009, "step": 27010 }, { "epoch": 0.74, "learning_rate": 3.3975966271941218e-06, "loss": 1.1321, "step": 27011 }, { "epoch": 0.74, "learning_rate": 3.3969323400104147e-06, "loss": 1.1545, "step": 27012 }, { "epoch": 0.74, "learning_rate": 3.3962681044860067e-06, "loss": 1.2493, "step": 27013 }, { "epoch": 0.74, "learning_rate": 3.395603920626093e-06, "loss": 1.4414, "step": 27014 }, { "epoch": 0.74, "learning_rate": 3.394939788435867e-06, "loss": 1.157, "step": 27015 }, { "epoch": 0.74, "learning_rate": 3.3942757079205236e-06, "loss": 1.2937, "step": 27016 }, { "epoch": 0.74, "learning_rate": 3.3936116790852637e-06, "loss": 1.385, "step": 27017 }, { "epoch": 0.74, "learning_rate": 3.3929477019352797e-06, "loss": 1.2751, "step": 27018 }, { "epoch": 0.74, "learning_rate": 3.392283776475762e-06, "loss": 1.2708, "step": 27019 }, { "epoch": 0.74, "learning_rate": 3.3916199027119132e-06, "loss": 1.281, "step": 27020 }, { "epoch": 0.74, "learning_rate": 3.3909560806489227e-06, "loss": 1.1277, "step": 27021 }, { "epoch": 0.74, "learning_rate": 3.390292310291984e-06, "loss": 1.2444, "step": 27022 }, { "epoch": 0.74, "learning_rate": 3.3896285916462867e-06, "loss": 1.2891, "step": 27023 }, { "epoch": 0.74, "learning_rate": 3.38896492471703e-06, "loss": 1.3069, "step": 27024 }, { "epoch": 0.74, "learning_rate": 3.388301309509403e-06, "loss": 1.1328, "step": 27025 }, { "epoch": 0.74, "learning_rate": 3.3876377460285983e-06, "loss": 1.2993, "step": 27026 }, { "epoch": 0.74, "learning_rate": 3.3869742342798028e-06, "loss": 1.1477, "step": 27027 }, { "epoch": 0.74, "learning_rate": 3.3863107742682142e-06, "loss": 1.1711, "step": 27028 }, { "epoch": 0.74, "learning_rate": 3.3856473659990207e-06, "loss": 1.2961, "step": 27029 }, { "epoch": 0.74, "learning_rate": 3.384984009477411e-06, "loss": 1.3618, "step": 27030 }, { "epoch": 0.74, "learning_rate": 3.3843207047085736e-06, "loss": 1.3301, "step": 27031 }, { "epoch": 0.74, "learning_rate": 3.3836574516976996e-06, "loss": 1.6685, "step": 27032 }, { "epoch": 0.74, "learning_rate": 3.3829942504499847e-06, "loss": 1.4343, "step": 27033 }, { "epoch": 0.74, "learning_rate": 3.382331100970605e-06, "loss": 1.217, "step": 27034 }, { "epoch": 0.74, "learning_rate": 3.3816680032647573e-06, "loss": 1.2058, "step": 27035 }, { "epoch": 0.74, "learning_rate": 3.3810049573376248e-06, "loss": 1.3613, "step": 27036 }, { "epoch": 0.74, "learning_rate": 3.3803419631944033e-06, "loss": 1.4111, "step": 27037 }, { "epoch": 0.74, "learning_rate": 3.3796790208402674e-06, "loss": 1.2754, "step": 27038 }, { "epoch": 0.74, "learning_rate": 3.3790161302804124e-06, "loss": 1.2861, "step": 27039 }, { "epoch": 0.74, "learning_rate": 3.378353291520019e-06, "loss": 1.2903, "step": 27040 }, { "epoch": 0.74, "learning_rate": 3.3776905045642816e-06, "loss": 1.1714, "step": 27041 }, { "epoch": 0.74, "learning_rate": 3.377027769418374e-06, "loss": 1.3401, "step": 27042 }, { "epoch": 0.74, "learning_rate": 3.3763650860874898e-06, "loss": 1.3101, "step": 27043 }, { "epoch": 0.74, "learning_rate": 3.375702454576807e-06, "loss": 1.2839, "step": 27044 }, { "epoch": 0.74, "learning_rate": 3.375039874891517e-06, "loss": 1.2039, "step": 27045 }, { "epoch": 0.74, "learning_rate": 3.3743773470367993e-06, "loss": 1.1309, "step": 27046 }, { "epoch": 0.74, "learning_rate": 3.373714871017837e-06, "loss": 1.3889, "step": 27047 }, { "epoch": 0.74, "learning_rate": 3.3730524468398107e-06, "loss": 1.3362, "step": 27048 }, { "epoch": 0.74, "learning_rate": 3.3723900745079096e-06, "loss": 1.207, "step": 27049 }, { "epoch": 0.74, "learning_rate": 3.371727754027312e-06, "loss": 1.3413, "step": 27050 }, { "epoch": 0.74, "learning_rate": 3.3710654854031964e-06, "loss": 1.4199, "step": 27051 }, { "epoch": 0.74, "learning_rate": 3.3704032686407507e-06, "loss": 1.2771, "step": 27052 }, { "epoch": 0.74, "learning_rate": 3.369741103745152e-06, "loss": 1.2651, "step": 27053 }, { "epoch": 0.74, "learning_rate": 3.3690789907215813e-06, "loss": 1.437, "step": 27054 }, { "epoch": 0.74, "learning_rate": 3.3684169295752147e-06, "loss": 1.1901, "step": 27055 }, { "epoch": 0.74, "learning_rate": 3.367754920311239e-06, "loss": 1.3623, "step": 27056 }, { "epoch": 0.74, "learning_rate": 3.3670929629348313e-06, "loss": 1.2517, "step": 27057 }, { "epoch": 0.74, "learning_rate": 3.3664310574511683e-06, "loss": 1.2976, "step": 27058 }, { "epoch": 0.74, "learning_rate": 3.3657692038654256e-06, "loss": 1.1877, "step": 27059 }, { "epoch": 0.74, "learning_rate": 3.365107402182789e-06, "loss": 1.3452, "step": 27060 }, { "epoch": 0.74, "learning_rate": 3.3644456524084324e-06, "loss": 1.4331, "step": 27061 }, { "epoch": 0.74, "learning_rate": 3.3637839545475326e-06, "loss": 1.2349, "step": 27062 }, { "epoch": 0.74, "learning_rate": 3.363122308605263e-06, "loss": 1.314, "step": 27063 }, { "epoch": 0.74, "learning_rate": 3.362460714586807e-06, "loss": 1.2651, "step": 27064 }, { "epoch": 0.74, "learning_rate": 3.3617991724973364e-06, "loss": 1.3496, "step": 27065 }, { "epoch": 0.74, "learning_rate": 3.361137682342026e-06, "loss": 1.2551, "step": 27066 }, { "epoch": 0.74, "learning_rate": 3.3604762441260542e-06, "loss": 1.2417, "step": 27067 }, { "epoch": 0.74, "learning_rate": 3.3598148578545953e-06, "loss": 1.3086, "step": 27068 }, { "epoch": 0.74, "learning_rate": 3.3591535235328223e-06, "loss": 1.3213, "step": 27069 }, { "epoch": 0.74, "learning_rate": 3.3584922411659048e-06, "loss": 1.2451, "step": 27070 }, { "epoch": 0.74, "learning_rate": 3.357831010759026e-06, "loss": 1.1614, "step": 27071 }, { "epoch": 0.74, "learning_rate": 3.357169832317353e-06, "loss": 1.2847, "step": 27072 }, { "epoch": 0.74, "learning_rate": 3.35650870584606e-06, "loss": 1.3687, "step": 27073 }, { "epoch": 0.74, "learning_rate": 3.3558476313503153e-06, "loss": 1.2004, "step": 27074 }, { "epoch": 0.74, "learning_rate": 3.355186608835298e-06, "loss": 1.2623, "step": 27075 }, { "epoch": 0.74, "learning_rate": 3.3545256383061764e-06, "loss": 1.2017, "step": 27076 }, { "epoch": 0.74, "learning_rate": 3.3538647197681206e-06, "loss": 1.0719, "step": 27077 }, { "epoch": 0.74, "learning_rate": 3.353203853226299e-06, "loss": 1.3184, "step": 27078 }, { "epoch": 0.74, "learning_rate": 3.3525430386858846e-06, "loss": 1.2607, "step": 27079 }, { "epoch": 0.74, "learning_rate": 3.351882276152051e-06, "loss": 1.3379, "step": 27080 }, { "epoch": 0.74, "learning_rate": 3.351221565629964e-06, "loss": 1.2178, "step": 27081 }, { "epoch": 0.74, "learning_rate": 3.3505609071247937e-06, "loss": 1.3284, "step": 27082 }, { "epoch": 0.74, "learning_rate": 3.3499003006417042e-06, "loss": 1.3271, "step": 27083 }, { "epoch": 0.74, "learning_rate": 3.3492397461858717e-06, "loss": 1.3076, "step": 27084 }, { "epoch": 0.74, "learning_rate": 3.34857924376246e-06, "loss": 1.2502, "step": 27085 }, { "epoch": 0.74, "learning_rate": 3.3479187933766354e-06, "loss": 1.8579, "step": 27086 }, { "epoch": 0.74, "learning_rate": 3.3472583950335633e-06, "loss": 1.3623, "step": 27087 }, { "epoch": 0.74, "learning_rate": 3.3465980487384175e-06, "loss": 1.2915, "step": 27088 }, { "epoch": 0.74, "learning_rate": 3.3459377544963587e-06, "loss": 1.3228, "step": 27089 }, { "epoch": 0.74, "learning_rate": 3.345277512312555e-06, "loss": 1.2104, "step": 27090 }, { "epoch": 0.74, "learning_rate": 3.3446173221921664e-06, "loss": 1.1487, "step": 27091 }, { "epoch": 0.74, "learning_rate": 3.3439571841403663e-06, "loss": 1.2441, "step": 27092 }, { "epoch": 0.74, "learning_rate": 3.343297098162315e-06, "loss": 1.2905, "step": 27093 }, { "epoch": 0.74, "learning_rate": 3.3426370642631733e-06, "loss": 1.1482, "step": 27094 }, { "epoch": 0.74, "learning_rate": 3.3419770824481135e-06, "loss": 1.2141, "step": 27095 }, { "epoch": 0.74, "learning_rate": 3.341317152722293e-06, "loss": 0.9373, "step": 27096 }, { "epoch": 0.74, "learning_rate": 3.3406572750908762e-06, "loss": 1.334, "step": 27097 }, { "epoch": 0.74, "learning_rate": 3.3399974495590216e-06, "loss": 1.3079, "step": 27098 }, { "epoch": 0.74, "learning_rate": 3.3393376761319e-06, "loss": 1.2148, "step": 27099 }, { "epoch": 0.74, "learning_rate": 3.3386779548146663e-06, "loss": 1.1609, "step": 27100 }, { "epoch": 0.74, "learning_rate": 3.3380182856124855e-06, "loss": 1.4065, "step": 27101 }, { "epoch": 0.74, "learning_rate": 3.3373586685305124e-06, "loss": 1.2935, "step": 27102 }, { "epoch": 0.74, "learning_rate": 3.336699103573916e-06, "loss": 1.168, "step": 27103 }, { "epoch": 0.74, "learning_rate": 3.3360395907478527e-06, "loss": 1.2671, "step": 27104 }, { "epoch": 0.74, "learning_rate": 3.3353801300574818e-06, "loss": 1.3164, "step": 27105 }, { "epoch": 0.74, "learning_rate": 3.3347207215079603e-06, "loss": 1.2925, "step": 27106 }, { "epoch": 0.74, "learning_rate": 3.3340613651044518e-06, "loss": 1.355, "step": 27107 }, { "epoch": 0.74, "learning_rate": 3.3334020608521134e-06, "loss": 1.0996, "step": 27108 }, { "epoch": 0.74, "learning_rate": 3.332742808756102e-06, "loss": 1.2112, "step": 27109 }, { "epoch": 0.74, "learning_rate": 3.3320836088215725e-06, "loss": 1.2283, "step": 27110 }, { "epoch": 0.74, "learning_rate": 3.331424461053685e-06, "loss": 1.2295, "step": 27111 }, { "epoch": 0.74, "learning_rate": 3.3307653654576044e-06, "loss": 1.3391, "step": 27112 }, { "epoch": 0.74, "learning_rate": 3.330106322038472e-06, "loss": 1.178, "step": 27113 }, { "epoch": 0.74, "learning_rate": 3.329447330801455e-06, "loss": 1.2649, "step": 27114 }, { "epoch": 0.74, "learning_rate": 3.3287883917517016e-06, "loss": 1.1111, "step": 27115 }, { "epoch": 0.74, "learning_rate": 3.3281295048943785e-06, "loss": 1.3108, "step": 27116 }, { "epoch": 0.74, "learning_rate": 3.3274706702346248e-06, "loss": 1.2356, "step": 27117 }, { "epoch": 0.74, "learning_rate": 3.326811887777607e-06, "loss": 1.3955, "step": 27118 }, { "epoch": 0.74, "learning_rate": 3.326153157528472e-06, "loss": 1.2441, "step": 27119 }, { "epoch": 0.74, "learning_rate": 3.3254944794923825e-06, "loss": 1.2307, "step": 27120 }, { "epoch": 0.74, "learning_rate": 3.3248358536744795e-06, "loss": 1.3613, "step": 27121 }, { "epoch": 0.74, "learning_rate": 3.3241772800799244e-06, "loss": 1.3037, "step": 27122 }, { "epoch": 0.74, "learning_rate": 3.323518758713864e-06, "loss": 1.1887, "step": 27123 }, { "epoch": 0.74, "learning_rate": 3.32286028958146e-06, "loss": 1.3708, "step": 27124 }, { "epoch": 0.74, "learning_rate": 3.3222018726878515e-06, "loss": 1.3071, "step": 27125 }, { "epoch": 0.74, "learning_rate": 3.321543508038194e-06, "loss": 1.2151, "step": 27126 }, { "epoch": 0.74, "learning_rate": 3.3208851956376443e-06, "loss": 1.1738, "step": 27127 }, { "epoch": 0.74, "learning_rate": 3.3202269354913473e-06, "loss": 1.175, "step": 27128 }, { "epoch": 0.74, "learning_rate": 3.3195687276044543e-06, "loss": 1.2629, "step": 27129 }, { "epoch": 0.74, "learning_rate": 3.31891057198211e-06, "loss": 1.3784, "step": 27130 }, { "epoch": 0.74, "learning_rate": 3.3182524686294713e-06, "loss": 1.2683, "step": 27131 }, { "epoch": 0.74, "learning_rate": 3.3175944175516838e-06, "loss": 1.238, "step": 27132 }, { "epoch": 0.74, "learning_rate": 3.3169364187538955e-06, "loss": 1.2312, "step": 27133 }, { "epoch": 0.74, "learning_rate": 3.31627847224125e-06, "loss": 1.2654, "step": 27134 }, { "epoch": 0.74, "learning_rate": 3.315620578018903e-06, "loss": 1.4246, "step": 27135 }, { "epoch": 0.74, "learning_rate": 3.3149627360919966e-06, "loss": 1.7866, "step": 27136 }, { "epoch": 0.74, "learning_rate": 3.3143049464656785e-06, "loss": 1.272, "step": 27137 }, { "epoch": 0.74, "learning_rate": 3.313647209145091e-06, "loss": 1.2368, "step": 27138 }, { "epoch": 0.74, "learning_rate": 3.312989524135387e-06, "loss": 1.3081, "step": 27139 }, { "epoch": 0.74, "learning_rate": 3.3123318914417093e-06, "loss": 1.7329, "step": 27140 }, { "epoch": 0.74, "learning_rate": 3.3116743110691984e-06, "loss": 1.3347, "step": 27141 }, { "epoch": 0.74, "learning_rate": 3.3110167830230056e-06, "loss": 1.123, "step": 27142 }, { "epoch": 0.74, "learning_rate": 3.3103593073082717e-06, "loss": 1.301, "step": 27143 }, { "epoch": 0.74, "learning_rate": 3.309701883930142e-06, "loss": 1.2881, "step": 27144 }, { "epoch": 0.74, "learning_rate": 3.3090445128937554e-06, "loss": 1.6694, "step": 27145 }, { "epoch": 0.74, "learning_rate": 3.30838719420426e-06, "loss": 1.3279, "step": 27146 }, { "epoch": 0.74, "learning_rate": 3.3077299278667984e-06, "loss": 1.0986, "step": 27147 }, { "epoch": 0.74, "learning_rate": 3.30707271388651e-06, "loss": 1.2026, "step": 27148 }, { "epoch": 0.74, "learning_rate": 3.306415552268534e-06, "loss": 1.3384, "step": 27149 }, { "epoch": 0.74, "learning_rate": 3.305758443018019e-06, "loss": 1.3608, "step": 27150 }, { "epoch": 0.74, "learning_rate": 3.3051013861401014e-06, "loss": 1.2822, "step": 27151 }, { "epoch": 0.74, "learning_rate": 3.304444381639923e-06, "loss": 1.3269, "step": 27152 }, { "epoch": 0.74, "learning_rate": 3.3037874295226202e-06, "loss": 1.2651, "step": 27153 }, { "epoch": 0.74, "learning_rate": 3.303130529793339e-06, "loss": 1.3274, "step": 27154 }, { "epoch": 0.74, "learning_rate": 3.3024736824572146e-06, "loss": 1.1616, "step": 27155 }, { "epoch": 0.74, "learning_rate": 3.3018168875193848e-06, "loss": 1.1709, "step": 27156 }, { "epoch": 0.74, "learning_rate": 3.301160144984992e-06, "loss": 1.2134, "step": 27157 }, { "epoch": 0.74, "learning_rate": 3.3005034548591684e-06, "loss": 1.2051, "step": 27158 }, { "epoch": 0.74, "learning_rate": 3.299846817147063e-06, "loss": 1.312, "step": 27159 }, { "epoch": 0.74, "learning_rate": 3.2991902318537994e-06, "loss": 1.2468, "step": 27160 }, { "epoch": 0.74, "learning_rate": 3.298533698984523e-06, "loss": 1.3447, "step": 27161 }, { "epoch": 0.74, "learning_rate": 3.297877218544365e-06, "loss": 1.3105, "step": 27162 }, { "epoch": 0.74, "learning_rate": 3.29722079053847e-06, "loss": 1.2537, "step": 27163 }, { "epoch": 0.74, "learning_rate": 3.296564414971961e-06, "loss": 1.4038, "step": 27164 }, { "epoch": 0.74, "learning_rate": 3.2959080918499843e-06, "loss": 1.2185, "step": 27165 }, { "epoch": 0.74, "learning_rate": 3.2952518211776665e-06, "loss": 1.3174, "step": 27166 }, { "epoch": 0.74, "learning_rate": 3.294595602960151e-06, "loss": 1.3887, "step": 27167 }, { "epoch": 0.74, "learning_rate": 3.2939394372025613e-06, "loss": 1.7036, "step": 27168 }, { "epoch": 0.74, "learning_rate": 3.2932833239100383e-06, "loss": 1.3044, "step": 27169 }, { "epoch": 0.74, "learning_rate": 3.2926272630877098e-06, "loss": 1.2102, "step": 27170 }, { "epoch": 0.74, "learning_rate": 3.291971254740719e-06, "loss": 1.4006, "step": 27171 }, { "epoch": 0.74, "learning_rate": 3.2913152988741824e-06, "loss": 1.2117, "step": 27172 }, { "epoch": 0.74, "learning_rate": 3.290659395493242e-06, "loss": 1.3296, "step": 27173 }, { "epoch": 0.74, "learning_rate": 3.29000354460303e-06, "loss": 1.3354, "step": 27174 }, { "epoch": 0.74, "learning_rate": 3.2893477462086752e-06, "loss": 1.1333, "step": 27175 }, { "epoch": 0.74, "learning_rate": 3.2886920003153077e-06, "loss": 1.1296, "step": 27176 }, { "epoch": 0.74, "learning_rate": 3.2880363069280553e-06, "loss": 1.2649, "step": 27177 }, { "epoch": 0.74, "learning_rate": 3.2873806660520536e-06, "loss": 1.0356, "step": 27178 }, { "epoch": 0.74, "learning_rate": 3.2867250776924296e-06, "loss": 1.2087, "step": 27179 }, { "epoch": 0.74, "learning_rate": 3.286069541854312e-06, "loss": 1.3247, "step": 27180 }, { "epoch": 0.74, "learning_rate": 3.285414058542825e-06, "loss": 1.1587, "step": 27181 }, { "epoch": 0.74, "learning_rate": 3.284758627763105e-06, "loss": 1.3428, "step": 27182 }, { "epoch": 0.74, "learning_rate": 3.284103249520275e-06, "loss": 1.7202, "step": 27183 }, { "epoch": 0.74, "learning_rate": 3.283447923819464e-06, "loss": 1.2788, "step": 27184 }, { "epoch": 0.74, "learning_rate": 3.2827926506657937e-06, "loss": 1.2104, "step": 27185 }, { "epoch": 0.74, "learning_rate": 3.2821374300643994e-06, "loss": 1.3735, "step": 27186 }, { "epoch": 0.74, "learning_rate": 3.281482262020402e-06, "loss": 1.2695, "step": 27187 }, { "epoch": 0.74, "learning_rate": 3.280827146538925e-06, "loss": 1.2192, "step": 27188 }, { "epoch": 0.74, "learning_rate": 3.2801720836251006e-06, "loss": 1.2322, "step": 27189 }, { "epoch": 0.74, "learning_rate": 3.2795170732840496e-06, "loss": 1.2983, "step": 27190 }, { "epoch": 0.74, "learning_rate": 3.2788621155208977e-06, "loss": 1.261, "step": 27191 }, { "epoch": 0.74, "learning_rate": 3.278207210340764e-06, "loss": 1.1768, "step": 27192 }, { "epoch": 0.74, "learning_rate": 3.27755235774878e-06, "loss": 1.3147, "step": 27193 }, { "epoch": 0.74, "learning_rate": 3.276897557750065e-06, "loss": 1.3237, "step": 27194 }, { "epoch": 0.74, "learning_rate": 3.2762428103497413e-06, "loss": 1.4248, "step": 27195 }, { "epoch": 0.74, "learning_rate": 3.27558811555293e-06, "loss": 1.3635, "step": 27196 }, { "epoch": 0.74, "learning_rate": 3.2749334733647573e-06, "loss": 1.2524, "step": 27197 }, { "epoch": 0.74, "learning_rate": 3.274278883790344e-06, "loss": 1.1692, "step": 27198 }, { "epoch": 0.74, "learning_rate": 3.2736243468348093e-06, "loss": 1.2695, "step": 27199 }, { "epoch": 0.74, "learning_rate": 3.2729698625032714e-06, "loss": 1.3271, "step": 27200 }, { "epoch": 0.74, "learning_rate": 3.2723154308008576e-06, "loss": 1.2769, "step": 27201 }, { "epoch": 0.74, "learning_rate": 3.2716610517326854e-06, "loss": 1.2151, "step": 27202 }, { "epoch": 0.74, "learning_rate": 3.271006725303868e-06, "loss": 1.2839, "step": 27203 }, { "epoch": 0.74, "learning_rate": 3.270352451519534e-06, "loss": 1.3413, "step": 27204 }, { "epoch": 0.74, "learning_rate": 3.2696982303847947e-06, "loss": 1.1624, "step": 27205 }, { "epoch": 0.74, "learning_rate": 3.269044061904778e-06, "loss": 1.417, "step": 27206 }, { "epoch": 0.74, "learning_rate": 3.268389946084589e-06, "loss": 1.3289, "step": 27207 }, { "epoch": 0.74, "learning_rate": 3.267735882929355e-06, "loss": 1.1853, "step": 27208 }, { "epoch": 0.74, "learning_rate": 3.2670818724441865e-06, "loss": 1.1935, "step": 27209 }, { "epoch": 0.74, "learning_rate": 3.266427914634209e-06, "loss": 1.6724, "step": 27210 }, { "epoch": 0.74, "learning_rate": 3.2657740095045277e-06, "loss": 1.6704, "step": 27211 }, { "epoch": 0.74, "learning_rate": 3.2651201570602677e-06, "loss": 1.3386, "step": 27212 }, { "epoch": 0.74, "learning_rate": 3.2644663573065362e-06, "loss": 1.1877, "step": 27213 }, { "epoch": 0.74, "learning_rate": 3.263812610248459e-06, "loss": 1.1836, "step": 27214 }, { "epoch": 0.74, "learning_rate": 3.263158915891138e-06, "loss": 1.3232, "step": 27215 }, { "epoch": 0.74, "learning_rate": 3.262505274239698e-06, "loss": 1.3245, "step": 27216 }, { "epoch": 0.74, "learning_rate": 3.2618516852992445e-06, "loss": 1.3025, "step": 27217 }, { "epoch": 0.74, "learning_rate": 3.261198149074898e-06, "loss": 1.3896, "step": 27218 }, { "epoch": 0.74, "learning_rate": 3.260544665571769e-06, "loss": 1.2388, "step": 27219 }, { "epoch": 0.74, "learning_rate": 3.259891234794965e-06, "loss": 1.1707, "step": 27220 }, { "epoch": 0.74, "learning_rate": 3.2592378567496074e-06, "loss": 1.3376, "step": 27221 }, { "epoch": 0.74, "learning_rate": 3.2585845314408014e-06, "loss": 1.3262, "step": 27222 }, { "epoch": 0.74, "learning_rate": 3.257931258873661e-06, "loss": 1.0828, "step": 27223 }, { "epoch": 0.74, "learning_rate": 3.2572780390532934e-06, "loss": 1.1138, "step": 27224 }, { "epoch": 0.74, "learning_rate": 3.256624871984814e-06, "loss": 1.4031, "step": 27225 }, { "epoch": 0.74, "learning_rate": 3.255971757673331e-06, "loss": 1.2705, "step": 27226 }, { "epoch": 0.74, "learning_rate": 3.2553186961239536e-06, "loss": 1.23, "step": 27227 }, { "epoch": 0.74, "learning_rate": 3.254665687341788e-06, "loss": 1.3411, "step": 27228 }, { "epoch": 0.74, "learning_rate": 3.254012731331949e-06, "loss": 1.1731, "step": 27229 }, { "epoch": 0.74, "learning_rate": 3.2533598280995438e-06, "loss": 1.479, "step": 27230 }, { "epoch": 0.74, "learning_rate": 3.252706977649677e-06, "loss": 1.2012, "step": 27231 }, { "epoch": 0.74, "learning_rate": 3.252054179987455e-06, "loss": 1.2952, "step": 27232 }, { "epoch": 0.74, "learning_rate": 3.2514014351179922e-06, "loss": 1.2515, "step": 27233 }, { "epoch": 0.74, "learning_rate": 3.2507487430463903e-06, "loss": 1.3621, "step": 27234 }, { "epoch": 0.74, "learning_rate": 3.2500961037777532e-06, "loss": 1.2456, "step": 27235 }, { "epoch": 0.74, "learning_rate": 3.2494435173171947e-06, "loss": 1.7896, "step": 27236 }, { "epoch": 0.74, "learning_rate": 3.248790983669814e-06, "loss": 1.2593, "step": 27237 }, { "epoch": 0.74, "learning_rate": 3.2481385028407196e-06, "loss": 1.2773, "step": 27238 }, { "epoch": 0.74, "learning_rate": 3.24748607483501e-06, "loss": 1.2329, "step": 27239 }, { "epoch": 0.74, "learning_rate": 3.2468336996577985e-06, "loss": 1.375, "step": 27240 }, { "epoch": 0.74, "learning_rate": 3.2461813773141836e-06, "loss": 1.3562, "step": 27241 }, { "epoch": 0.74, "learning_rate": 3.24552910780927e-06, "loss": 1.2705, "step": 27242 }, { "epoch": 0.74, "learning_rate": 3.2448768911481577e-06, "loss": 1.2228, "step": 27243 }, { "epoch": 0.74, "learning_rate": 3.244224727335955e-06, "loss": 1.199, "step": 27244 }, { "epoch": 0.74, "learning_rate": 3.2435726163777614e-06, "loss": 1.2966, "step": 27245 }, { "epoch": 0.74, "learning_rate": 3.2429205582786782e-06, "loss": 1.2563, "step": 27246 }, { "epoch": 0.74, "learning_rate": 3.2422685530438048e-06, "loss": 1.3384, "step": 27247 }, { "epoch": 0.74, "learning_rate": 3.241616600678247e-06, "loss": 1.3079, "step": 27248 }, { "epoch": 0.74, "learning_rate": 3.2409647011871025e-06, "loss": 1.2986, "step": 27249 }, { "epoch": 0.74, "learning_rate": 3.240312854575469e-06, "loss": 1.2874, "step": 27250 }, { "epoch": 0.74, "learning_rate": 3.2396610608484524e-06, "loss": 1.2322, "step": 27251 }, { "epoch": 0.74, "learning_rate": 3.2390093200111463e-06, "loss": 1.2947, "step": 27252 }, { "epoch": 0.74, "learning_rate": 3.2383576320686573e-06, "loss": 1.1885, "step": 27253 }, { "epoch": 0.74, "learning_rate": 3.2377059970260725e-06, "loss": 1.2468, "step": 27254 }, { "epoch": 0.74, "learning_rate": 3.2370544148884998e-06, "loss": 1.2422, "step": 27255 }, { "epoch": 0.74, "learning_rate": 3.23640288566103e-06, "loss": 1.3889, "step": 27256 }, { "epoch": 0.74, "learning_rate": 3.2357514093487694e-06, "loss": 1.175, "step": 27257 }, { "epoch": 0.74, "learning_rate": 3.2350999859568033e-06, "loss": 1.3269, "step": 27258 }, { "epoch": 0.74, "learning_rate": 3.2344486154902366e-06, "loss": 1.3572, "step": 27259 }, { "epoch": 0.74, "learning_rate": 3.2337972979541586e-06, "loss": 1.136, "step": 27260 }, { "epoch": 0.74, "learning_rate": 3.233146033353677e-06, "loss": 1.2739, "step": 27261 }, { "epoch": 0.74, "learning_rate": 3.2324948216938713e-06, "loss": 1.4026, "step": 27262 }, { "epoch": 0.74, "learning_rate": 3.2318436629798468e-06, "loss": 1.387, "step": 27263 }, { "epoch": 0.74, "learning_rate": 3.2311925572166923e-06, "loss": 1.2578, "step": 27264 }, { "epoch": 0.74, "learning_rate": 3.2305415044095066e-06, "loss": 1.2954, "step": 27265 }, { "epoch": 0.74, "learning_rate": 3.229890504563382e-06, "loss": 1.1777, "step": 27266 }, { "epoch": 0.74, "learning_rate": 3.2292395576834067e-06, "loss": 1.7017, "step": 27267 }, { "epoch": 0.74, "learning_rate": 3.228588663774681e-06, "loss": 1.168, "step": 27268 }, { "epoch": 0.74, "learning_rate": 3.227937822842293e-06, "loss": 1.2278, "step": 27269 }, { "epoch": 0.74, "learning_rate": 3.2272870348913355e-06, "loss": 1.2439, "step": 27270 }, { "epoch": 0.74, "learning_rate": 3.2266362999268953e-06, "loss": 1.325, "step": 27271 }, { "epoch": 0.74, "learning_rate": 3.2259856179540716e-06, "loss": 1.2107, "step": 27272 }, { "epoch": 0.74, "learning_rate": 3.2253349889779505e-06, "loss": 1.3394, "step": 27273 }, { "epoch": 0.74, "learning_rate": 3.2246844130036235e-06, "loss": 1.3611, "step": 27274 }, { "epoch": 0.74, "learning_rate": 3.2240338900361766e-06, "loss": 1.0796, "step": 27275 }, { "epoch": 0.74, "learning_rate": 3.223383420080705e-06, "loss": 1.3108, "step": 27276 }, { "epoch": 0.74, "learning_rate": 3.2227330031422952e-06, "loss": 1.3413, "step": 27277 }, { "epoch": 0.74, "learning_rate": 3.2220826392260352e-06, "loss": 1.2563, "step": 27278 }, { "epoch": 0.74, "learning_rate": 3.2214323283370096e-06, "loss": 1.3435, "step": 27279 }, { "epoch": 0.74, "learning_rate": 3.220782070480315e-06, "loss": 1.1477, "step": 27280 }, { "epoch": 0.75, "learning_rate": 3.2201318656610327e-06, "loss": 1.3296, "step": 27281 }, { "epoch": 0.75, "learning_rate": 3.219481713884246e-06, "loss": 1.0522, "step": 27282 }, { "epoch": 0.75, "learning_rate": 3.2188316151550515e-06, "loss": 1.28, "step": 27283 }, { "epoch": 0.75, "learning_rate": 3.2181815694785278e-06, "loss": 1.4089, "step": 27284 }, { "epoch": 0.75, "learning_rate": 3.2175315768597637e-06, "loss": 1.353, "step": 27285 }, { "epoch": 0.75, "learning_rate": 3.216881637303839e-06, "loss": 1.4089, "step": 27286 }, { "epoch": 0.75, "learning_rate": 3.216231750815847e-06, "loss": 1.2439, "step": 27287 }, { "epoch": 0.75, "learning_rate": 3.2155819174008674e-06, "loss": 1.0966, "step": 27288 }, { "epoch": 0.75, "learning_rate": 3.214932137063984e-06, "loss": 1.3811, "step": 27289 }, { "epoch": 0.75, "learning_rate": 3.214282409810279e-06, "loss": 1.2212, "step": 27290 }, { "epoch": 0.75, "learning_rate": 3.2136327356448393e-06, "loss": 1.147, "step": 27291 }, { "epoch": 0.75, "learning_rate": 3.2129831145727462e-06, "loss": 1.2461, "step": 27292 }, { "epoch": 0.75, "learning_rate": 3.2123335465990823e-06, "loss": 1.3574, "step": 27293 }, { "epoch": 0.75, "learning_rate": 3.2116840317289255e-06, "loss": 1.3582, "step": 27294 }, { "epoch": 0.75, "learning_rate": 3.211034569967365e-06, "loss": 1.0999, "step": 27295 }, { "epoch": 0.75, "learning_rate": 3.210385161319476e-06, "loss": 1.2986, "step": 27296 }, { "epoch": 0.75, "learning_rate": 3.209735805790338e-06, "loss": 1.3484, "step": 27297 }, { "epoch": 0.75, "learning_rate": 3.209086503385038e-06, "loss": 1.1692, "step": 27298 }, { "epoch": 0.75, "learning_rate": 3.2084372541086484e-06, "loss": 1.269, "step": 27299 }, { "epoch": 0.75, "learning_rate": 3.207788057966258e-06, "loss": 1.2949, "step": 27300 }, { "epoch": 0.75, "learning_rate": 3.207138914962934e-06, "loss": 1.3062, "step": 27301 }, { "epoch": 0.75, "learning_rate": 3.2064898251037645e-06, "loss": 1.3479, "step": 27302 }, { "epoch": 0.75, "learning_rate": 3.2058407883938204e-06, "loss": 1.2458, "step": 27303 }, { "epoch": 0.75, "learning_rate": 3.2051918048381892e-06, "loss": 1.4458, "step": 27304 }, { "epoch": 0.75, "learning_rate": 3.204542874441936e-06, "loss": 1.0471, "step": 27305 }, { "epoch": 0.75, "learning_rate": 3.203893997210147e-06, "loss": 1.3528, "step": 27306 }, { "epoch": 0.75, "learning_rate": 3.203245173147893e-06, "loss": 1.2776, "step": 27307 }, { "epoch": 0.75, "learning_rate": 3.2025964022602584e-06, "loss": 1.333, "step": 27308 }, { "epoch": 0.75, "learning_rate": 3.201947684552307e-06, "loss": 1.3655, "step": 27309 }, { "epoch": 0.75, "learning_rate": 3.201299020029124e-06, "loss": 1.0786, "step": 27310 }, { "epoch": 0.75, "learning_rate": 3.2006504086957755e-06, "loss": 1.0762, "step": 27311 }, { "epoch": 0.75, "learning_rate": 3.200001850557346e-06, "loss": 1.0024, "step": 27312 }, { "epoch": 0.75, "learning_rate": 3.199353345618904e-06, "loss": 1.2527, "step": 27313 }, { "epoch": 0.75, "learning_rate": 3.1987048938855203e-06, "loss": 1.3223, "step": 27314 }, { "epoch": 0.75, "learning_rate": 3.198056495362274e-06, "loss": 1.2642, "step": 27315 }, { "epoch": 0.75, "learning_rate": 3.1974081500542366e-06, "loss": 1.2349, "step": 27316 }, { "epoch": 0.75, "learning_rate": 3.1967598579664773e-06, "loss": 1.415, "step": 27317 }, { "epoch": 0.75, "learning_rate": 3.1961116191040674e-06, "loss": 1.0886, "step": 27318 }, { "epoch": 0.75, "learning_rate": 3.1954634334720836e-06, "loss": 1.113, "step": 27319 }, { "epoch": 0.75, "learning_rate": 3.1948153010755945e-06, "loss": 1.2869, "step": 27320 }, { "epoch": 0.75, "learning_rate": 3.1941672219196705e-06, "loss": 1.2969, "step": 27321 }, { "epoch": 0.75, "learning_rate": 3.193519196009378e-06, "loss": 1.3884, "step": 27322 }, { "epoch": 0.75, "learning_rate": 3.192871223349795e-06, "loss": 1.3423, "step": 27323 }, { "epoch": 0.75, "learning_rate": 3.192223303945986e-06, "loss": 1.2048, "step": 27324 }, { "epoch": 0.75, "learning_rate": 3.1915754378030205e-06, "loss": 1.2876, "step": 27325 }, { "epoch": 0.75, "learning_rate": 3.1909276249259646e-06, "loss": 1.3328, "step": 27326 }, { "epoch": 0.75, "learning_rate": 3.190279865319892e-06, "loss": 1.3818, "step": 27327 }, { "epoch": 0.75, "learning_rate": 3.189632158989867e-06, "loss": 1.4922, "step": 27328 }, { "epoch": 0.75, "learning_rate": 3.1889845059409552e-06, "loss": 1.1887, "step": 27329 }, { "epoch": 0.75, "learning_rate": 3.1883369061782287e-06, "loss": 1.0875, "step": 27330 }, { "epoch": 0.75, "learning_rate": 3.1876893597067504e-06, "loss": 1.1895, "step": 27331 }, { "epoch": 0.75, "learning_rate": 3.1870418665315883e-06, "loss": 1.1366, "step": 27332 }, { "epoch": 0.75, "learning_rate": 3.186394426657803e-06, "loss": 1.1072, "step": 27333 }, { "epoch": 0.75, "learning_rate": 3.1857470400904676e-06, "loss": 1.1052, "step": 27334 }, { "epoch": 0.75, "learning_rate": 3.1850997068346423e-06, "loss": 1.2402, "step": 27335 }, { "epoch": 0.75, "learning_rate": 3.1844524268953936e-06, "loss": 1.302, "step": 27336 }, { "epoch": 0.75, "learning_rate": 3.18380520027778e-06, "loss": 1.1512, "step": 27337 }, { "epoch": 0.75, "learning_rate": 3.1831580269868724e-06, "loss": 1.3152, "step": 27338 }, { "epoch": 0.75, "learning_rate": 3.1825109070277317e-06, "loss": 1.3125, "step": 27339 }, { "epoch": 0.75, "learning_rate": 3.1818638404054193e-06, "loss": 1.2258, "step": 27340 }, { "epoch": 0.75, "learning_rate": 3.1812168271249944e-06, "loss": 1.2651, "step": 27341 }, { "epoch": 0.75, "learning_rate": 3.180569867191523e-06, "loss": 1.0444, "step": 27342 }, { "epoch": 0.75, "learning_rate": 3.17992296061007e-06, "loss": 1.2241, "step": 27343 }, { "epoch": 0.75, "learning_rate": 3.1792761073856927e-06, "loss": 1.2749, "step": 27344 }, { "epoch": 0.75, "learning_rate": 3.1786293075234507e-06, "loss": 1.4226, "step": 27345 }, { "epoch": 0.75, "learning_rate": 3.177982561028403e-06, "loss": 1.283, "step": 27346 }, { "epoch": 0.75, "learning_rate": 3.1773358679056153e-06, "loss": 1.3149, "step": 27347 }, { "epoch": 0.75, "learning_rate": 3.1766892281601425e-06, "loss": 1.2517, "step": 27348 }, { "epoch": 0.75, "learning_rate": 3.176042641797046e-06, "loss": 1.2021, "step": 27349 }, { "epoch": 0.75, "learning_rate": 3.1753961088213793e-06, "loss": 1.3711, "step": 27350 }, { "epoch": 0.75, "learning_rate": 3.174749629238206e-06, "loss": 1.314, "step": 27351 }, { "epoch": 0.75, "learning_rate": 3.1741032030525843e-06, "loss": 1.3638, "step": 27352 }, { "epoch": 0.75, "learning_rate": 3.173456830269568e-06, "loss": 1.1794, "step": 27353 }, { "epoch": 0.75, "learning_rate": 3.1728105108942133e-06, "loss": 1.3557, "step": 27354 }, { "epoch": 0.75, "learning_rate": 3.1721642449315814e-06, "loss": 1.313, "step": 27355 }, { "epoch": 0.75, "learning_rate": 3.171518032386726e-06, "loss": 1.2678, "step": 27356 }, { "epoch": 0.75, "learning_rate": 3.1708718732647015e-06, "loss": 0.9924, "step": 27357 }, { "epoch": 0.75, "learning_rate": 3.1702257675705615e-06, "loss": 1.3188, "step": 27358 }, { "epoch": 0.75, "learning_rate": 3.1695797153093677e-06, "loss": 1.1819, "step": 27359 }, { "epoch": 0.75, "learning_rate": 3.1689337164861687e-06, "loss": 1.2319, "step": 27360 }, { "epoch": 0.75, "learning_rate": 3.1682877711060176e-06, "loss": 1.1704, "step": 27361 }, { "epoch": 0.75, "learning_rate": 3.167641879173975e-06, "loss": 1.1797, "step": 27362 }, { "epoch": 0.75, "learning_rate": 3.1669960406950883e-06, "loss": 1.3928, "step": 27363 }, { "epoch": 0.75, "learning_rate": 3.166350255674412e-06, "loss": 1.1816, "step": 27364 }, { "epoch": 0.75, "learning_rate": 3.165704524116994e-06, "loss": 1.2896, "step": 27365 }, { "epoch": 0.75, "learning_rate": 3.165058846027893e-06, "loss": 1.1897, "step": 27366 }, { "epoch": 0.75, "learning_rate": 3.1644132214121583e-06, "loss": 1.3303, "step": 27367 }, { "epoch": 0.75, "learning_rate": 3.1637676502748404e-06, "loss": 1.2234, "step": 27368 }, { "epoch": 0.75, "learning_rate": 3.163122132620986e-06, "loss": 1.2202, "step": 27369 }, { "epoch": 0.75, "learning_rate": 3.1624766684556528e-06, "loss": 1.2161, "step": 27370 }, { "epoch": 0.75, "learning_rate": 3.161831257783886e-06, "loss": 1.1934, "step": 27371 }, { "epoch": 0.75, "learning_rate": 3.161185900610737e-06, "loss": 1.2031, "step": 27372 }, { "epoch": 0.75, "learning_rate": 3.1605405969412505e-06, "loss": 1.2371, "step": 27373 }, { "epoch": 0.75, "learning_rate": 3.1598953467804806e-06, "loss": 1.3372, "step": 27374 }, { "epoch": 0.75, "learning_rate": 3.159250150133474e-06, "loss": 1.3359, "step": 27375 }, { "epoch": 0.75, "learning_rate": 3.158605007005273e-06, "loss": 1.4102, "step": 27376 }, { "epoch": 0.75, "learning_rate": 3.1579599174009336e-06, "loss": 1.2454, "step": 27377 }, { "epoch": 0.75, "learning_rate": 3.157314881325495e-06, "loss": 1.3037, "step": 27378 }, { "epoch": 0.75, "learning_rate": 3.1566698987840138e-06, "loss": 1.2827, "step": 27379 }, { "epoch": 0.75, "learning_rate": 3.1560249697815228e-06, "loss": 1.3135, "step": 27380 }, { "epoch": 0.75, "learning_rate": 3.1553800943230773e-06, "loss": 1.2405, "step": 27381 }, { "epoch": 0.75, "learning_rate": 3.154735272413716e-06, "loss": 1.0989, "step": 27382 }, { "epoch": 0.75, "learning_rate": 3.1540905040584934e-06, "loss": 1.217, "step": 27383 }, { "epoch": 0.75, "learning_rate": 3.1534457892624414e-06, "loss": 1.1025, "step": 27384 }, { "epoch": 0.75, "learning_rate": 3.1528011280306126e-06, "loss": 1.2151, "step": 27385 }, { "epoch": 0.75, "learning_rate": 3.152156520368046e-06, "loss": 1.3579, "step": 27386 }, { "epoch": 0.75, "learning_rate": 3.151511966279792e-06, "loss": 1.4126, "step": 27387 }, { "epoch": 0.75, "learning_rate": 3.1508674657708815e-06, "loss": 1.3845, "step": 27388 }, { "epoch": 0.75, "learning_rate": 3.1502230188463644e-06, "loss": 1.2268, "step": 27389 }, { "epoch": 0.75, "learning_rate": 3.1495786255112837e-06, "loss": 1.2747, "step": 27390 }, { "epoch": 0.75, "learning_rate": 3.1489342857706795e-06, "loss": 1.2375, "step": 27391 }, { "epoch": 0.75, "learning_rate": 3.1482899996295914e-06, "loss": 1.3965, "step": 27392 }, { "epoch": 0.75, "learning_rate": 3.147645767093056e-06, "loss": 1.178, "step": 27393 }, { "epoch": 0.75, "learning_rate": 3.147001588166123e-06, "loss": 1.2778, "step": 27394 }, { "epoch": 0.75, "learning_rate": 3.1463574628538263e-06, "loss": 1.2766, "step": 27395 }, { "epoch": 0.75, "learning_rate": 3.145713391161206e-06, "loss": 1.3398, "step": 27396 }, { "epoch": 0.75, "learning_rate": 3.145069373093297e-06, "loss": 1.2693, "step": 27397 }, { "epoch": 0.75, "learning_rate": 3.1444254086551463e-06, "loss": 1.188, "step": 27398 }, { "epoch": 0.75, "learning_rate": 3.1437814978517865e-06, "loss": 1.0969, "step": 27399 }, { "epoch": 0.75, "learning_rate": 3.1431376406882564e-06, "loss": 1.3406, "step": 27400 }, { "epoch": 0.75, "learning_rate": 3.14249383716959e-06, "loss": 1.1146, "step": 27401 }, { "epoch": 0.75, "learning_rate": 3.1418500873008308e-06, "loss": 1.179, "step": 27402 }, { "epoch": 0.75, "learning_rate": 3.1412063910870116e-06, "loss": 1.3022, "step": 27403 }, { "epoch": 0.75, "learning_rate": 3.140562748533168e-06, "loss": 1.3503, "step": 27404 }, { "epoch": 0.75, "learning_rate": 3.1399191596443324e-06, "loss": 1.3157, "step": 27405 }, { "epoch": 0.75, "learning_rate": 3.1392756244255475e-06, "loss": 1.3173, "step": 27406 }, { "epoch": 0.75, "learning_rate": 3.1386321428818433e-06, "loss": 1.0844, "step": 27407 }, { "epoch": 0.75, "learning_rate": 3.137988715018252e-06, "loss": 1.335, "step": 27408 }, { "epoch": 0.75, "learning_rate": 3.1373453408398134e-06, "loss": 1.3821, "step": 27409 }, { "epoch": 0.75, "learning_rate": 3.1367020203515573e-06, "loss": 1.3501, "step": 27410 }, { "epoch": 0.75, "learning_rate": 3.1360587535585176e-06, "loss": 1.3779, "step": 27411 }, { "epoch": 0.75, "learning_rate": 3.135415540465724e-06, "loss": 1.219, "step": 27412 }, { "epoch": 0.75, "learning_rate": 3.134772381078214e-06, "loss": 1.4189, "step": 27413 }, { "epoch": 0.75, "learning_rate": 3.1341292754010157e-06, "loss": 1.1272, "step": 27414 }, { "epoch": 0.75, "learning_rate": 3.1334862234391627e-06, "loss": 1.3196, "step": 27415 }, { "epoch": 0.75, "learning_rate": 3.1328432251976804e-06, "loss": 1.2412, "step": 27416 }, { "epoch": 0.75, "learning_rate": 3.132200280681608e-06, "loss": 1.1021, "step": 27417 }, { "epoch": 0.75, "learning_rate": 3.1315573898959696e-06, "loss": 1.3662, "step": 27418 }, { "epoch": 0.75, "learning_rate": 3.1309145528457974e-06, "loss": 1.2065, "step": 27419 }, { "epoch": 0.75, "learning_rate": 3.1302717695361163e-06, "loss": 1.1228, "step": 27420 }, { "epoch": 0.75, "learning_rate": 3.1296290399719585e-06, "loss": 1.2625, "step": 27421 }, { "epoch": 0.75, "learning_rate": 3.1289863641583584e-06, "loss": 1.2275, "step": 27422 }, { "epoch": 0.75, "learning_rate": 3.1283437421003326e-06, "loss": 1.2307, "step": 27423 }, { "epoch": 0.75, "learning_rate": 3.127701173802916e-06, "loss": 1.2308, "step": 27424 }, { "epoch": 0.75, "learning_rate": 3.1270586592711316e-06, "loss": 1.2822, "step": 27425 }, { "epoch": 0.75, "learning_rate": 3.1264161985100137e-06, "loss": 1.4595, "step": 27426 }, { "epoch": 0.75, "learning_rate": 3.1257737915245778e-06, "loss": 1.2097, "step": 27427 }, { "epoch": 0.75, "learning_rate": 3.125131438319858e-06, "loss": 1.1816, "step": 27428 }, { "epoch": 0.75, "learning_rate": 3.1244891389008747e-06, "loss": 1.1726, "step": 27429 }, { "epoch": 0.75, "learning_rate": 3.123846893272662e-06, "loss": 1.2224, "step": 27430 }, { "epoch": 0.75, "learning_rate": 3.12320470144023e-06, "loss": 1.3108, "step": 27431 }, { "epoch": 0.75, "learning_rate": 3.1225625634086144e-06, "loss": 1.3574, "step": 27432 }, { "epoch": 0.75, "learning_rate": 3.1219204791828316e-06, "loss": 1.2188, "step": 27433 }, { "epoch": 0.75, "learning_rate": 3.121278448767916e-06, "loss": 1.4021, "step": 27434 }, { "epoch": 0.75, "learning_rate": 3.1206364721688763e-06, "loss": 1.1724, "step": 27435 }, { "epoch": 0.75, "learning_rate": 3.1199945493907425e-06, "loss": 1.7632, "step": 27436 }, { "epoch": 0.75, "learning_rate": 3.1193526804385386e-06, "loss": 1.2795, "step": 27437 }, { "epoch": 0.75, "learning_rate": 3.1187108653172835e-06, "loss": 1.0759, "step": 27438 }, { "epoch": 0.75, "learning_rate": 3.118069104032e-06, "loss": 1.3032, "step": 27439 }, { "epoch": 0.75, "learning_rate": 3.1174273965877043e-06, "loss": 1.1538, "step": 27440 }, { "epoch": 0.75, "learning_rate": 3.116785742989423e-06, "loss": 1.396, "step": 27441 }, { "epoch": 0.75, "learning_rate": 3.1161441432421733e-06, "loss": 1.3323, "step": 27442 }, { "epoch": 0.75, "learning_rate": 3.1155025973509745e-06, "loss": 1.3005, "step": 27443 }, { "epoch": 0.75, "learning_rate": 3.1148611053208432e-06, "loss": 1.2607, "step": 27444 }, { "epoch": 0.75, "learning_rate": 3.114219667156805e-06, "loss": 1.4185, "step": 27445 }, { "epoch": 0.75, "learning_rate": 3.1135782828638727e-06, "loss": 1.1765, "step": 27446 }, { "epoch": 0.75, "learning_rate": 3.1129369524470666e-06, "loss": 1.2175, "step": 27447 }, { "epoch": 0.75, "learning_rate": 3.1122956759113997e-06, "loss": 1.1843, "step": 27448 }, { "epoch": 0.75, "learning_rate": 3.1116544532618963e-06, "loss": 1.4312, "step": 27449 }, { "epoch": 0.75, "learning_rate": 3.111013284503569e-06, "loss": 1.2249, "step": 27450 }, { "epoch": 0.75, "learning_rate": 3.1103721696414314e-06, "loss": 1.4331, "step": 27451 }, { "epoch": 0.75, "learning_rate": 3.109731108680505e-06, "loss": 1.1421, "step": 27452 }, { "epoch": 0.75, "learning_rate": 3.1090901016258023e-06, "loss": 1.2373, "step": 27453 }, { "epoch": 0.75, "learning_rate": 3.108449148482339e-06, "loss": 1.2261, "step": 27454 }, { "epoch": 0.75, "learning_rate": 3.1078082492551254e-06, "loss": 1.3721, "step": 27455 }, { "epoch": 0.75, "learning_rate": 3.107167403949182e-06, "loss": 1.1272, "step": 27456 }, { "epoch": 0.75, "learning_rate": 3.10652661256952e-06, "loss": 1.1812, "step": 27457 }, { "epoch": 0.75, "learning_rate": 3.105885875121152e-06, "loss": 1.2209, "step": 27458 }, { "epoch": 0.75, "learning_rate": 3.1052451916090875e-06, "loss": 1.1353, "step": 27459 }, { "epoch": 0.75, "learning_rate": 3.104604562038347e-06, "loss": 1.2122, "step": 27460 }, { "epoch": 0.75, "learning_rate": 3.1039639864139372e-06, "loss": 1.2183, "step": 27461 }, { "epoch": 0.75, "learning_rate": 3.1033234647408696e-06, "loss": 1.3835, "step": 27462 }, { "epoch": 0.75, "learning_rate": 3.1026829970241536e-06, "loss": 1.2271, "step": 27463 }, { "epoch": 0.75, "learning_rate": 3.102042583268806e-06, "loss": 1.3403, "step": 27464 }, { "epoch": 0.75, "learning_rate": 3.1014022234798333e-06, "loss": 1.4304, "step": 27465 }, { "epoch": 0.75, "learning_rate": 3.100761917662246e-06, "loss": 1.1855, "step": 27466 }, { "epoch": 0.75, "learning_rate": 3.1001216658210497e-06, "loss": 1.2876, "step": 27467 }, { "epoch": 0.75, "learning_rate": 3.099481467961256e-06, "loss": 1.2476, "step": 27468 }, { "epoch": 0.75, "learning_rate": 3.0988413240878825e-06, "loss": 1.3103, "step": 27469 }, { "epoch": 0.75, "learning_rate": 3.098201234205922e-06, "loss": 1.3232, "step": 27470 }, { "epoch": 0.75, "learning_rate": 3.0975611983203935e-06, "loss": 1.3169, "step": 27471 }, { "epoch": 0.75, "learning_rate": 3.096921216436296e-06, "loss": 1.2642, "step": 27472 }, { "epoch": 0.75, "learning_rate": 3.096281288558648e-06, "loss": 1.2522, "step": 27473 }, { "epoch": 0.75, "learning_rate": 3.095641414692443e-06, "loss": 1.1575, "step": 27474 }, { "epoch": 0.75, "learning_rate": 3.095001594842695e-06, "loss": 1.2397, "step": 27475 }, { "epoch": 0.75, "learning_rate": 3.094361829014405e-06, "loss": 1.3853, "step": 27476 }, { "epoch": 0.75, "learning_rate": 3.0937221172125877e-06, "loss": 1.0649, "step": 27477 }, { "epoch": 0.75, "learning_rate": 3.093082459442234e-06, "loss": 1.2327, "step": 27478 }, { "epoch": 0.75, "learning_rate": 3.0924428557083575e-06, "loss": 1.217, "step": 27479 }, { "epoch": 0.75, "learning_rate": 3.0918033060159582e-06, "loss": 1.2825, "step": 27480 }, { "epoch": 0.75, "learning_rate": 3.091163810370047e-06, "loss": 1.4124, "step": 27481 }, { "epoch": 0.75, "learning_rate": 3.090524368775616e-06, "loss": 1.3076, "step": 27482 }, { "epoch": 0.75, "learning_rate": 3.089884981237672e-06, "loss": 1.1023, "step": 27483 }, { "epoch": 0.75, "learning_rate": 3.0892456477612223e-06, "loss": 1.1887, "step": 27484 }, { "epoch": 0.75, "learning_rate": 3.0886063683512647e-06, "loss": 1.2334, "step": 27485 }, { "epoch": 0.75, "learning_rate": 3.087967143012801e-06, "loss": 1.2498, "step": 27486 }, { "epoch": 0.75, "learning_rate": 3.08732797175083e-06, "loss": 1.2156, "step": 27487 }, { "epoch": 0.75, "learning_rate": 3.0866888545703565e-06, "loss": 1.175, "step": 27488 }, { "epoch": 0.75, "learning_rate": 3.0860497914763786e-06, "loss": 1.3904, "step": 27489 }, { "epoch": 0.75, "learning_rate": 3.0854107824738955e-06, "loss": 1.2654, "step": 27490 }, { "epoch": 0.75, "learning_rate": 3.084771827567905e-06, "loss": 1.3096, "step": 27491 }, { "epoch": 0.75, "learning_rate": 3.08413292676341e-06, "loss": 1.2902, "step": 27492 }, { "epoch": 0.75, "learning_rate": 3.083494080065408e-06, "loss": 1.2822, "step": 27493 }, { "epoch": 0.75, "learning_rate": 3.082855287478894e-06, "loss": 1.4458, "step": 27494 }, { "epoch": 0.75, "learning_rate": 3.0822165490088664e-06, "loss": 1.322, "step": 27495 }, { "epoch": 0.75, "learning_rate": 3.0815778646603257e-06, "loss": 1.2822, "step": 27496 }, { "epoch": 0.75, "learning_rate": 3.080939234438267e-06, "loss": 1.4519, "step": 27497 }, { "epoch": 0.75, "learning_rate": 3.0803006583476825e-06, "loss": 1.4102, "step": 27498 }, { "epoch": 0.75, "learning_rate": 3.0796621363935753e-06, "loss": 1.2925, "step": 27499 }, { "epoch": 0.75, "learning_rate": 3.0790236685809384e-06, "loss": 1.2268, "step": 27500 }, { "epoch": 0.75, "learning_rate": 3.078385254914764e-06, "loss": 1.4353, "step": 27501 }, { "epoch": 0.75, "learning_rate": 3.0777468954000466e-06, "loss": 1.21, "step": 27502 }, { "epoch": 0.75, "learning_rate": 3.077108590041785e-06, "loss": 1.1453, "step": 27503 }, { "epoch": 0.75, "learning_rate": 3.0764703388449703e-06, "loss": 1.175, "step": 27504 }, { "epoch": 0.75, "learning_rate": 3.0758321418145965e-06, "loss": 1.3176, "step": 27505 }, { "epoch": 0.75, "learning_rate": 3.0751939989556533e-06, "loss": 1.2517, "step": 27506 }, { "epoch": 0.75, "learning_rate": 3.074555910273138e-06, "loss": 1.1699, "step": 27507 }, { "epoch": 0.75, "learning_rate": 3.073917875772041e-06, "loss": 1.3799, "step": 27508 }, { "epoch": 0.75, "learning_rate": 3.073279895457354e-06, "loss": 1.3264, "step": 27509 }, { "epoch": 0.75, "learning_rate": 3.072641969334065e-06, "loss": 1.3623, "step": 27510 }, { "epoch": 0.75, "learning_rate": 3.0720040974071708e-06, "loss": 1.1169, "step": 27511 }, { "epoch": 0.75, "learning_rate": 3.071366279681658e-06, "loss": 1.3652, "step": 27512 }, { "epoch": 0.75, "learning_rate": 3.0707285161625158e-06, "loss": 1.4106, "step": 27513 }, { "epoch": 0.75, "learning_rate": 3.0700908068547362e-06, "loss": 1.2612, "step": 27514 }, { "epoch": 0.75, "learning_rate": 3.0694531517633063e-06, "loss": 1.3057, "step": 27515 }, { "epoch": 0.75, "learning_rate": 3.0688155508932217e-06, "loss": 1.062, "step": 27516 }, { "epoch": 0.75, "learning_rate": 3.068178004249458e-06, "loss": 1.3845, "step": 27517 }, { "epoch": 0.75, "learning_rate": 3.0675405118370138e-06, "loss": 1.2996, "step": 27518 }, { "epoch": 0.75, "learning_rate": 3.0669030736608698e-06, "loss": 1.064, "step": 27519 }, { "epoch": 0.75, "learning_rate": 3.0662656897260213e-06, "loss": 1.3081, "step": 27520 }, { "epoch": 0.75, "learning_rate": 3.065628360037444e-06, "loss": 1.1887, "step": 27521 }, { "epoch": 0.75, "learning_rate": 3.064991084600133e-06, "loss": 1.2034, "step": 27522 }, { "epoch": 0.75, "learning_rate": 3.0643538634190673e-06, "loss": 1.229, "step": 27523 }, { "epoch": 0.75, "learning_rate": 3.0637166964992416e-06, "loss": 1.3508, "step": 27524 }, { "epoch": 0.75, "learning_rate": 3.0630795838456282e-06, "loss": 1.1685, "step": 27525 }, { "epoch": 0.75, "learning_rate": 3.0624425254632217e-06, "loss": 1.3523, "step": 27526 }, { "epoch": 0.75, "learning_rate": 3.061805521357e-06, "loss": 1.2827, "step": 27527 }, { "epoch": 0.75, "learning_rate": 3.061168571531955e-06, "loss": 1.261, "step": 27528 }, { "epoch": 0.75, "learning_rate": 3.060531675993058e-06, "loss": 1.3789, "step": 27529 }, { "epoch": 0.75, "learning_rate": 3.059894834745298e-06, "loss": 1.322, "step": 27530 }, { "epoch": 0.75, "learning_rate": 3.0592580477936606e-06, "loss": 1.3223, "step": 27531 }, { "epoch": 0.75, "learning_rate": 3.0586213151431254e-06, "loss": 1.4026, "step": 27532 }, { "epoch": 0.75, "learning_rate": 3.057984636798672e-06, "loss": 1.1848, "step": 27533 }, { "epoch": 0.75, "learning_rate": 3.0573480127652786e-06, "loss": 1.2871, "step": 27534 }, { "epoch": 0.75, "learning_rate": 3.056711443047934e-06, "loss": 1.2095, "step": 27535 }, { "epoch": 0.75, "learning_rate": 3.0560749276516145e-06, "loss": 1.323, "step": 27536 }, { "epoch": 0.75, "learning_rate": 3.055438466581299e-06, "loss": 1.2217, "step": 27537 }, { "epoch": 0.75, "learning_rate": 3.0548020598419625e-06, "loss": 1.2839, "step": 27538 }, { "epoch": 0.75, "learning_rate": 3.0541657074385942e-06, "loss": 1.3167, "step": 27539 }, { "epoch": 0.75, "learning_rate": 3.053529409376166e-06, "loss": 1.3521, "step": 27540 }, { "epoch": 0.75, "learning_rate": 3.0528931656596584e-06, "loss": 1.3577, "step": 27541 }, { "epoch": 0.75, "learning_rate": 3.0522569762940434e-06, "loss": 1.3181, "step": 27542 }, { "epoch": 0.75, "learning_rate": 3.0516208412843064e-06, "loss": 1.3066, "step": 27543 }, { "epoch": 0.75, "learning_rate": 3.0509847606354215e-06, "loss": 1.1372, "step": 27544 }, { "epoch": 0.75, "learning_rate": 3.0503487343523596e-06, "loss": 1.1221, "step": 27545 }, { "epoch": 0.75, "learning_rate": 3.0497127624401057e-06, "loss": 1.2744, "step": 27546 }, { "epoch": 0.75, "learning_rate": 3.04907684490363e-06, "loss": 1.3208, "step": 27547 }, { "epoch": 0.75, "learning_rate": 3.0484409817479087e-06, "loss": 1.2842, "step": 27548 }, { "epoch": 0.75, "learning_rate": 3.0478051729779135e-06, "loss": 1.208, "step": 27549 }, { "epoch": 0.75, "learning_rate": 3.0471694185986245e-06, "loss": 1.3843, "step": 27550 }, { "epoch": 0.75, "learning_rate": 3.0465337186150125e-06, "loss": 1.3127, "step": 27551 }, { "epoch": 0.75, "learning_rate": 3.0458980730320496e-06, "loss": 1.158, "step": 27552 }, { "epoch": 0.75, "learning_rate": 3.0452624818547092e-06, "loss": 1.1555, "step": 27553 }, { "epoch": 0.75, "learning_rate": 3.0446269450879663e-06, "loss": 1.2322, "step": 27554 }, { "epoch": 0.75, "learning_rate": 3.0439914627367926e-06, "loss": 1.2695, "step": 27555 }, { "epoch": 0.75, "learning_rate": 3.0433560348061584e-06, "loss": 1.3833, "step": 27556 }, { "epoch": 0.75, "learning_rate": 3.0427206613010317e-06, "loss": 1.1836, "step": 27557 }, { "epoch": 0.75, "learning_rate": 3.0420853422263908e-06, "loss": 1.3477, "step": 27558 }, { "epoch": 0.75, "learning_rate": 3.0414500775872023e-06, "loss": 1.3015, "step": 27559 }, { "epoch": 0.75, "learning_rate": 3.0408148673884332e-06, "loss": 1.0322, "step": 27560 }, { "epoch": 0.75, "learning_rate": 3.0401797116350586e-06, "loss": 1.7212, "step": 27561 }, { "epoch": 0.75, "learning_rate": 3.0395446103320425e-06, "loss": 1.2915, "step": 27562 }, { "epoch": 0.75, "learning_rate": 3.0389095634843626e-06, "loss": 1.1129, "step": 27563 }, { "epoch": 0.75, "learning_rate": 3.0382745710969742e-06, "loss": 1.373, "step": 27564 }, { "epoch": 0.75, "learning_rate": 3.037639633174856e-06, "loss": 1.2737, "step": 27565 }, { "epoch": 0.75, "learning_rate": 3.0370047497229673e-06, "loss": 1.4343, "step": 27566 }, { "epoch": 0.75, "learning_rate": 3.036369920746286e-06, "loss": 1.229, "step": 27567 }, { "epoch": 0.75, "learning_rate": 3.0357351462497653e-06, "loss": 1.3206, "step": 27568 }, { "epoch": 0.75, "learning_rate": 3.035100426238382e-06, "loss": 1.2192, "step": 27569 }, { "epoch": 0.75, "learning_rate": 3.0344657607170937e-06, "loss": 1.4214, "step": 27570 }, { "epoch": 0.75, "learning_rate": 3.033831149690877e-06, "loss": 1.3042, "step": 27571 }, { "epoch": 0.75, "learning_rate": 3.033196593164682e-06, "loss": 1.2751, "step": 27572 }, { "epoch": 0.75, "learning_rate": 3.032562091143485e-06, "loss": 1.2905, "step": 27573 }, { "epoch": 0.75, "learning_rate": 3.0319276436322433e-06, "loss": 1.1997, "step": 27574 }, { "epoch": 0.75, "learning_rate": 3.0312932506359248e-06, "loss": 1.1656, "step": 27575 }, { "epoch": 0.75, "learning_rate": 3.030658912159492e-06, "loss": 1.1694, "step": 27576 }, { "epoch": 0.75, "learning_rate": 3.0300246282079036e-06, "loss": 1.3228, "step": 27577 }, { "epoch": 0.75, "learning_rate": 3.0293903987861273e-06, "loss": 1.2781, "step": 27578 }, { "epoch": 0.75, "learning_rate": 3.028756223899123e-06, "loss": 1.1948, "step": 27579 }, { "epoch": 0.75, "learning_rate": 3.0281221035518527e-06, "loss": 1.2336, "step": 27580 }, { "epoch": 0.75, "learning_rate": 3.0274880377492734e-06, "loss": 1.2471, "step": 27581 }, { "epoch": 0.75, "learning_rate": 3.026854026496351e-06, "loss": 1.2781, "step": 27582 }, { "epoch": 0.75, "learning_rate": 3.026220069798045e-06, "loss": 1.3293, "step": 27583 }, { "epoch": 0.75, "learning_rate": 3.0255861676593124e-06, "loss": 1.4041, "step": 27584 }, { "epoch": 0.75, "learning_rate": 3.0249523200851117e-06, "loss": 1.4016, "step": 27585 }, { "epoch": 0.75, "learning_rate": 3.0243185270804075e-06, "loss": 1.3645, "step": 27586 }, { "epoch": 0.75, "learning_rate": 3.023684788650154e-06, "loss": 1.3103, "step": 27587 }, { "epoch": 0.75, "learning_rate": 3.0230511047993115e-06, "loss": 1.1963, "step": 27588 }, { "epoch": 0.75, "learning_rate": 3.022417475532833e-06, "loss": 1.4629, "step": 27589 }, { "epoch": 0.75, "learning_rate": 3.0217839008556816e-06, "loss": 1.2847, "step": 27590 }, { "epoch": 0.75, "learning_rate": 3.0211503807728117e-06, "loss": 1.1672, "step": 27591 }, { "epoch": 0.75, "learning_rate": 3.020516915289177e-06, "loss": 1.2314, "step": 27592 }, { "epoch": 0.75, "learning_rate": 3.0198835044097386e-06, "loss": 1.2246, "step": 27593 }, { "epoch": 0.75, "learning_rate": 3.0192501481394488e-06, "loss": 1.2522, "step": 27594 }, { "epoch": 0.75, "learning_rate": 3.018616846483264e-06, "loss": 1.1274, "step": 27595 }, { "epoch": 0.75, "learning_rate": 3.017983599446135e-06, "loss": 1.3806, "step": 27596 }, { "epoch": 0.75, "learning_rate": 3.0173504070330227e-06, "loss": 1.0928, "step": 27597 }, { "epoch": 0.75, "learning_rate": 3.0167172692488766e-06, "loss": 1.1699, "step": 27598 }, { "epoch": 0.75, "learning_rate": 3.016084186098651e-06, "loss": 1.1904, "step": 27599 }, { "epoch": 0.75, "learning_rate": 3.0154511575872957e-06, "loss": 1.2458, "step": 27600 }, { "epoch": 0.75, "learning_rate": 3.0148181837197687e-06, "loss": 1.1907, "step": 27601 }, { "epoch": 0.75, "learning_rate": 3.0141852645010206e-06, "loss": 1.2192, "step": 27602 }, { "epoch": 0.75, "learning_rate": 3.0135523999360007e-06, "loss": 1.2043, "step": 27603 }, { "epoch": 0.75, "learning_rate": 3.0129195900296594e-06, "loss": 1.197, "step": 27604 }, { "epoch": 0.75, "learning_rate": 3.0122868347869527e-06, "loss": 1.1851, "step": 27605 }, { "epoch": 0.75, "learning_rate": 3.011654134212825e-06, "loss": 1.2783, "step": 27606 }, { "epoch": 0.75, "learning_rate": 3.0110214883122312e-06, "loss": 1.3201, "step": 27607 }, { "epoch": 0.75, "learning_rate": 3.0103888970901208e-06, "loss": 1.1621, "step": 27608 }, { "epoch": 0.75, "learning_rate": 3.009756360551436e-06, "loss": 1.3091, "step": 27609 }, { "epoch": 0.75, "learning_rate": 3.0091238787011346e-06, "loss": 1.2471, "step": 27610 }, { "epoch": 0.75, "learning_rate": 3.00849145154416e-06, "loss": 1.0735, "step": 27611 }, { "epoch": 0.75, "learning_rate": 3.0078590790854613e-06, "loss": 1.0552, "step": 27612 }, { "epoch": 0.75, "learning_rate": 3.007226761329981e-06, "loss": 1.2556, "step": 27613 }, { "epoch": 0.75, "learning_rate": 3.0065944982826743e-06, "loss": 1.3608, "step": 27614 }, { "epoch": 0.75, "learning_rate": 3.005962289948483e-06, "loss": 1.126, "step": 27615 }, { "epoch": 0.75, "learning_rate": 3.005330136332355e-06, "loss": 1.2212, "step": 27616 }, { "epoch": 0.75, "learning_rate": 3.004698037439231e-06, "loss": 1.3245, "step": 27617 }, { "epoch": 0.75, "learning_rate": 3.0040659932740634e-06, "loss": 1.2273, "step": 27618 }, { "epoch": 0.75, "learning_rate": 3.003434003841794e-06, "loss": 1.3054, "step": 27619 }, { "epoch": 0.75, "learning_rate": 3.002802069147367e-06, "loss": 1.408, "step": 27620 }, { "epoch": 0.75, "learning_rate": 3.002170189195722e-06, "loss": 1.2256, "step": 27621 }, { "epoch": 0.75, "learning_rate": 3.0015383639918115e-06, "loss": 1.2415, "step": 27622 }, { "epoch": 0.75, "learning_rate": 3.0009065935405735e-06, "loss": 1.2417, "step": 27623 }, { "epoch": 0.75, "learning_rate": 3.000274877846947e-06, "loss": 1.4153, "step": 27624 }, { "epoch": 0.75, "learning_rate": 2.999643216915883e-06, "loss": 1.1997, "step": 27625 }, { "epoch": 0.75, "learning_rate": 2.999011610752317e-06, "loss": 1.291, "step": 27626 }, { "epoch": 0.75, "learning_rate": 2.998380059361193e-06, "loss": 1.3247, "step": 27627 }, { "epoch": 0.75, "learning_rate": 2.997748562747448e-06, "loss": 1.2954, "step": 27628 }, { "epoch": 0.75, "learning_rate": 2.9971171209160288e-06, "loss": 1.3433, "step": 27629 }, { "epoch": 0.75, "learning_rate": 2.9964857338718724e-06, "loss": 1.2632, "step": 27630 }, { "epoch": 0.75, "learning_rate": 2.9958544016199176e-06, "loss": 1.2139, "step": 27631 }, { "epoch": 0.75, "learning_rate": 2.995223124165102e-06, "loss": 1.2017, "step": 27632 }, { "epoch": 0.75, "learning_rate": 2.9945919015123692e-06, "loss": 1.4053, "step": 27633 }, { "epoch": 0.75, "learning_rate": 2.9939607336666554e-06, "loss": 1.1799, "step": 27634 }, { "epoch": 0.75, "learning_rate": 2.993329620632899e-06, "loss": 1.249, "step": 27635 }, { "epoch": 0.75, "learning_rate": 2.992698562416032e-06, "loss": 1.2092, "step": 27636 }, { "epoch": 0.75, "learning_rate": 2.992067559021001e-06, "loss": 1.2332, "step": 27637 }, { "epoch": 0.75, "learning_rate": 2.991436610452738e-06, "loss": 1.3037, "step": 27638 }, { "epoch": 0.75, "learning_rate": 2.9908057167161763e-06, "loss": 1.1624, "step": 27639 }, { "epoch": 0.75, "learning_rate": 2.9901748778162577e-06, "loss": 1.261, "step": 27640 }, { "epoch": 0.75, "learning_rate": 2.989544093757911e-06, "loss": 1.248, "step": 27641 }, { "epoch": 0.75, "learning_rate": 2.988913364546081e-06, "loss": 1.2271, "step": 27642 }, { "epoch": 0.75, "learning_rate": 2.98828269018569e-06, "loss": 1.1421, "step": 27643 }, { "epoch": 0.75, "learning_rate": 2.9876520706816813e-06, "loss": 1.0149, "step": 27644 }, { "epoch": 0.75, "learning_rate": 2.987021506038982e-06, "loss": 1.2412, "step": 27645 }, { "epoch": 0.75, "learning_rate": 2.9863909962625347e-06, "loss": 1.3652, "step": 27646 }, { "epoch": 0.76, "learning_rate": 2.985760541357261e-06, "loss": 1.3198, "step": 27647 }, { "epoch": 0.76, "learning_rate": 2.9851301413281007e-06, "loss": 1.2695, "step": 27648 }, { "epoch": 0.76, "learning_rate": 2.9844997961799814e-06, "loss": 1.1204, "step": 27649 }, { "epoch": 0.76, "learning_rate": 2.9838695059178425e-06, "loss": 1.252, "step": 27650 }, { "epoch": 0.76, "learning_rate": 2.983239270546603e-06, "loss": 1.2532, "step": 27651 }, { "epoch": 0.76, "learning_rate": 2.982609090071202e-06, "loss": 1.0776, "step": 27652 }, { "epoch": 0.76, "learning_rate": 2.9819789644965658e-06, "loss": 1.3342, "step": 27653 }, { "epoch": 0.76, "learning_rate": 2.981348893827629e-06, "loss": 1.3662, "step": 27654 }, { "epoch": 0.76, "learning_rate": 2.9807188780693184e-06, "loss": 1.4155, "step": 27655 }, { "epoch": 0.76, "learning_rate": 2.980088917226559e-06, "loss": 1.6768, "step": 27656 }, { "epoch": 0.76, "learning_rate": 2.9794590113042865e-06, "loss": 1.2092, "step": 27657 }, { "epoch": 0.76, "learning_rate": 2.9788291603074248e-06, "loss": 1.3213, "step": 27658 }, { "epoch": 0.76, "learning_rate": 2.9781993642409025e-06, "loss": 1.1415, "step": 27659 }, { "epoch": 0.76, "learning_rate": 2.977569623109643e-06, "loss": 1.3208, "step": 27660 }, { "epoch": 0.76, "learning_rate": 2.9769399369185804e-06, "loss": 1.3013, "step": 27661 }, { "epoch": 0.76, "learning_rate": 2.976310305672637e-06, "loss": 1.1116, "step": 27662 }, { "epoch": 0.76, "learning_rate": 2.9756807293767387e-06, "loss": 1.1897, "step": 27663 }, { "epoch": 0.76, "learning_rate": 2.9750512080358085e-06, "loss": 1.2024, "step": 27664 }, { "epoch": 0.76, "learning_rate": 2.974421741654777e-06, "loss": 1.2925, "step": 27665 }, { "epoch": 0.76, "learning_rate": 2.973792330238566e-06, "loss": 1.1912, "step": 27666 }, { "epoch": 0.76, "learning_rate": 2.9731629737921008e-06, "loss": 1.2136, "step": 27667 }, { "epoch": 0.76, "learning_rate": 2.9725336723203e-06, "loss": 1.2559, "step": 27668 }, { "epoch": 0.76, "learning_rate": 2.9719044258280947e-06, "loss": 1.3206, "step": 27669 }, { "epoch": 0.76, "learning_rate": 2.9712752343204054e-06, "loss": 1.3088, "step": 27670 }, { "epoch": 0.76, "learning_rate": 2.970646097802149e-06, "loss": 1.1697, "step": 27671 }, { "epoch": 0.76, "learning_rate": 2.970017016278256e-06, "loss": 1.2097, "step": 27672 }, { "epoch": 0.76, "learning_rate": 2.9693879897536436e-06, "loss": 1.1543, "step": 27673 }, { "epoch": 0.76, "learning_rate": 2.968759018233234e-06, "loss": 1.3291, "step": 27674 }, { "epoch": 0.76, "learning_rate": 2.9681301017219442e-06, "loss": 1.1709, "step": 27675 }, { "epoch": 0.76, "learning_rate": 2.9675012402247007e-06, "loss": 1.2434, "step": 27676 }, { "epoch": 0.76, "learning_rate": 2.9668724337464217e-06, "loss": 1.3311, "step": 27677 }, { "epoch": 0.76, "learning_rate": 2.9662436822920247e-06, "loss": 1.4868, "step": 27678 }, { "epoch": 0.76, "learning_rate": 2.9656149858664263e-06, "loss": 1.291, "step": 27679 }, { "epoch": 0.76, "learning_rate": 2.964986344474552e-06, "loss": 1.4404, "step": 27680 }, { "epoch": 0.76, "learning_rate": 2.9643577581213157e-06, "loss": 1.2051, "step": 27681 }, { "epoch": 0.76, "learning_rate": 2.9637292268116367e-06, "loss": 1.397, "step": 27682 }, { "epoch": 0.76, "learning_rate": 2.9631007505504283e-06, "loss": 1.3977, "step": 27683 }, { "epoch": 0.76, "learning_rate": 2.9624723293426103e-06, "loss": 1.1404, "step": 27684 }, { "epoch": 0.76, "learning_rate": 2.9618439631931062e-06, "loss": 1.1216, "step": 27685 }, { "epoch": 0.76, "learning_rate": 2.961215652106819e-06, "loss": 1.2107, "step": 27686 }, { "epoch": 0.76, "learning_rate": 2.9605873960886734e-06, "loss": 1.636, "step": 27687 }, { "epoch": 0.76, "learning_rate": 2.9599591951435792e-06, "loss": 1.3311, "step": 27688 }, { "epoch": 0.76, "learning_rate": 2.9593310492764606e-06, "loss": 1.3083, "step": 27689 }, { "epoch": 0.76, "learning_rate": 2.9587029584922177e-06, "loss": 1.2119, "step": 27690 }, { "epoch": 0.76, "learning_rate": 2.958074922795775e-06, "loss": 1.2791, "step": 27691 }, { "epoch": 0.76, "learning_rate": 2.9574469421920402e-06, "loss": 1.113, "step": 27692 }, { "epoch": 0.76, "learning_rate": 2.9568190166859346e-06, "loss": 1.2092, "step": 27693 }, { "epoch": 0.76, "learning_rate": 2.95619114628236e-06, "loss": 1.3018, "step": 27694 }, { "epoch": 0.76, "learning_rate": 2.955563330986235e-06, "loss": 1.1661, "step": 27695 }, { "epoch": 0.76, "learning_rate": 2.9549355708024684e-06, "loss": 1.2383, "step": 27696 }, { "epoch": 0.76, "learning_rate": 2.954307865735978e-06, "loss": 1.0657, "step": 27697 }, { "epoch": 0.76, "learning_rate": 2.9536802157916646e-06, "loss": 1.3787, "step": 27698 }, { "epoch": 0.76, "learning_rate": 2.953052620974444e-06, "loss": 1.2068, "step": 27699 }, { "epoch": 0.76, "learning_rate": 2.9524250812892284e-06, "loss": 1.2329, "step": 27700 }, { "epoch": 0.76, "learning_rate": 2.951797596740925e-06, "loss": 1.3987, "step": 27701 }, { "epoch": 0.76, "learning_rate": 2.951170167334443e-06, "loss": 1.241, "step": 27702 }, { "epoch": 0.76, "learning_rate": 2.9505427930746876e-06, "loss": 1.3064, "step": 27703 }, { "epoch": 0.76, "learning_rate": 2.9499154739665735e-06, "loss": 1.3755, "step": 27704 }, { "epoch": 0.76, "learning_rate": 2.9492882100150065e-06, "loss": 1.1606, "step": 27705 }, { "epoch": 0.76, "learning_rate": 2.9486610012248916e-06, "loss": 1.2063, "step": 27706 }, { "epoch": 0.76, "learning_rate": 2.948033847601136e-06, "loss": 1.3186, "step": 27707 }, { "epoch": 0.76, "learning_rate": 2.947406749148649e-06, "loss": 1.3457, "step": 27708 }, { "epoch": 0.76, "learning_rate": 2.946779705872336e-06, "loss": 1.1851, "step": 27709 }, { "epoch": 0.76, "learning_rate": 2.946152717777102e-06, "loss": 1.1256, "step": 27710 }, { "epoch": 0.76, "learning_rate": 2.9455257848678487e-06, "loss": 1.1812, "step": 27711 }, { "epoch": 0.76, "learning_rate": 2.944898907149488e-06, "loss": 1.3679, "step": 27712 }, { "epoch": 0.76, "learning_rate": 2.9442720846269203e-06, "loss": 1.3237, "step": 27713 }, { "epoch": 0.76, "learning_rate": 2.9436453173050496e-06, "loss": 1.1592, "step": 27714 }, { "epoch": 0.76, "learning_rate": 2.943018605188778e-06, "loss": 1.26, "step": 27715 }, { "epoch": 0.76, "learning_rate": 2.942391948283012e-06, "loss": 1.394, "step": 27716 }, { "epoch": 0.76, "learning_rate": 2.941765346592653e-06, "loss": 1.3528, "step": 27717 }, { "epoch": 0.76, "learning_rate": 2.9411388001226006e-06, "loss": 1.2876, "step": 27718 }, { "epoch": 0.76, "learning_rate": 2.9405123088777623e-06, "loss": 1.3398, "step": 27719 }, { "epoch": 0.76, "learning_rate": 2.939885872863035e-06, "loss": 1.2676, "step": 27720 }, { "epoch": 0.76, "learning_rate": 2.9392594920833205e-06, "loss": 1.2512, "step": 27721 }, { "epoch": 0.76, "learning_rate": 2.9386331665435177e-06, "loss": 1.2822, "step": 27722 }, { "epoch": 0.76, "learning_rate": 2.938006896248531e-06, "loss": 1.338, "step": 27723 }, { "epoch": 0.76, "learning_rate": 2.9373806812032567e-06, "loss": 1.3013, "step": 27724 }, { "epoch": 0.76, "learning_rate": 2.9367545214125958e-06, "loss": 1.2742, "step": 27725 }, { "epoch": 0.76, "learning_rate": 2.936128416881443e-06, "loss": 1.3088, "step": 27726 }, { "epoch": 0.76, "learning_rate": 2.935502367614703e-06, "loss": 1.3621, "step": 27727 }, { "epoch": 0.76, "learning_rate": 2.9348763736172704e-06, "loss": 1.4292, "step": 27728 }, { "epoch": 0.76, "learning_rate": 2.9342504348940437e-06, "loss": 1.2653, "step": 27729 }, { "epoch": 0.76, "learning_rate": 2.933624551449914e-06, "loss": 1.26, "step": 27730 }, { "epoch": 0.76, "learning_rate": 2.932998723289785e-06, "loss": 1.1532, "step": 27731 }, { "epoch": 0.76, "learning_rate": 2.932372950418555e-06, "loss": 1.262, "step": 27732 }, { "epoch": 0.76, "learning_rate": 2.9317472328411114e-06, "loss": 1.3823, "step": 27733 }, { "epoch": 0.76, "learning_rate": 2.9311215705623552e-06, "loss": 1.1987, "step": 27734 }, { "epoch": 0.76, "learning_rate": 2.9304959635871776e-06, "loss": 1.2219, "step": 27735 }, { "epoch": 0.76, "learning_rate": 2.9298704119204813e-06, "loss": 1.3318, "step": 27736 }, { "epoch": 0.76, "learning_rate": 2.9292449155671477e-06, "loss": 1.1144, "step": 27737 }, { "epoch": 0.76, "learning_rate": 2.9286194745320806e-06, "loss": 1.2476, "step": 27738 }, { "epoch": 0.76, "learning_rate": 2.9279940888201662e-06, "loss": 1.2766, "step": 27739 }, { "epoch": 0.76, "learning_rate": 2.9273687584363076e-06, "loss": 1.2036, "step": 27740 }, { "epoch": 0.76, "learning_rate": 2.9267434833853824e-06, "loss": 1.4399, "step": 27741 }, { "epoch": 0.76, "learning_rate": 2.926118263672294e-06, "loss": 1.3972, "step": 27742 }, { "epoch": 0.76, "learning_rate": 2.925493099301927e-06, "loss": 1.1863, "step": 27743 }, { "epoch": 0.76, "learning_rate": 2.924867990279181e-06, "loss": 1.2361, "step": 27744 }, { "epoch": 0.76, "learning_rate": 2.9242429366089343e-06, "loss": 1.2354, "step": 27745 }, { "epoch": 0.76, "learning_rate": 2.923617938296085e-06, "loss": 1.2874, "step": 27746 }, { "epoch": 0.76, "learning_rate": 2.9229929953455237e-06, "loss": 1.1449, "step": 27747 }, { "epoch": 0.76, "learning_rate": 2.9223681077621367e-06, "loss": 1.2117, "step": 27748 }, { "epoch": 0.76, "learning_rate": 2.921743275550815e-06, "loss": 1.3203, "step": 27749 }, { "epoch": 0.76, "learning_rate": 2.921118498716441e-06, "loss": 1.2891, "step": 27750 }, { "epoch": 0.76, "learning_rate": 2.920493777263911e-06, "loss": 1.1416, "step": 27751 }, { "epoch": 0.76, "learning_rate": 2.919869111198108e-06, "loss": 1.3584, "step": 27752 }, { "epoch": 0.76, "learning_rate": 2.91924450052392e-06, "loss": 1.2158, "step": 27753 }, { "epoch": 0.76, "learning_rate": 2.9186199452462305e-06, "loss": 1.4565, "step": 27754 }, { "epoch": 0.76, "learning_rate": 2.917995445369932e-06, "loss": 1.1697, "step": 27755 }, { "epoch": 0.76, "learning_rate": 2.917371000899907e-06, "loss": 1.1338, "step": 27756 }, { "epoch": 0.76, "learning_rate": 2.9167466118410404e-06, "loss": 1.4404, "step": 27757 }, { "epoch": 0.76, "learning_rate": 2.9161222781982147e-06, "loss": 1.2437, "step": 27758 }, { "epoch": 0.76, "learning_rate": 2.91549799997632e-06, "loss": 1.2842, "step": 27759 }, { "epoch": 0.76, "learning_rate": 2.9148737771802383e-06, "loss": 1.1577, "step": 27760 }, { "epoch": 0.76, "learning_rate": 2.914249609814849e-06, "loss": 1.1929, "step": 27761 }, { "epoch": 0.76, "learning_rate": 2.913625497885041e-06, "loss": 1.2205, "step": 27762 }, { "epoch": 0.76, "learning_rate": 2.9130014413956965e-06, "loss": 1.2769, "step": 27763 }, { "epoch": 0.76, "learning_rate": 2.9123774403516946e-06, "loss": 1.1011, "step": 27764 }, { "epoch": 0.76, "learning_rate": 2.911753494757916e-06, "loss": 1.2061, "step": 27765 }, { "epoch": 0.76, "learning_rate": 2.9111296046192495e-06, "loss": 1.2456, "step": 27766 }, { "epoch": 0.76, "learning_rate": 2.9105057699405704e-06, "loss": 1.3206, "step": 27767 }, { "epoch": 0.76, "learning_rate": 2.9098819907267606e-06, "loss": 1.2778, "step": 27768 }, { "epoch": 0.76, "learning_rate": 2.909258266982696e-06, "loss": 1.2239, "step": 27769 }, { "epoch": 0.76, "learning_rate": 2.9086345987132648e-06, "loss": 1.3247, "step": 27770 }, { "epoch": 0.76, "learning_rate": 2.908010985923342e-06, "loss": 1.332, "step": 27771 }, { "epoch": 0.76, "learning_rate": 2.907387428617805e-06, "loss": 1.2429, "step": 27772 }, { "epoch": 0.76, "learning_rate": 2.9067639268015313e-06, "loss": 1.3459, "step": 27773 }, { "epoch": 0.76, "learning_rate": 2.906140480479405e-06, "loss": 1.2634, "step": 27774 }, { "epoch": 0.76, "learning_rate": 2.905517089656299e-06, "loss": 1.4041, "step": 27775 }, { "epoch": 0.76, "learning_rate": 2.9048937543370915e-06, "loss": 1.2671, "step": 27776 }, { "epoch": 0.76, "learning_rate": 2.904270474526656e-06, "loss": 1.3181, "step": 27777 }, { "epoch": 0.76, "learning_rate": 2.903647250229871e-06, "loss": 1.1504, "step": 27778 }, { "epoch": 0.76, "learning_rate": 2.9030240814516197e-06, "loss": 1.3066, "step": 27779 }, { "epoch": 0.76, "learning_rate": 2.9024009681967637e-06, "loss": 1.0828, "step": 27780 }, { "epoch": 0.76, "learning_rate": 2.9017779104701893e-06, "loss": 1.3782, "step": 27781 }, { "epoch": 0.76, "learning_rate": 2.901154908276763e-06, "loss": 1.1427, "step": 27782 }, { "epoch": 0.76, "learning_rate": 2.9005319616213688e-06, "loss": 1.1304, "step": 27783 }, { "epoch": 0.76, "learning_rate": 2.8999090705088682e-06, "loss": 1.1709, "step": 27784 }, { "epoch": 0.76, "learning_rate": 2.899286234944143e-06, "loss": 1.3271, "step": 27785 }, { "epoch": 0.76, "learning_rate": 2.8986634549320603e-06, "loss": 1.2197, "step": 27786 }, { "epoch": 0.76, "learning_rate": 2.8980407304775015e-06, "loss": 1.1724, "step": 27787 }, { "epoch": 0.76, "learning_rate": 2.8974180615853266e-06, "loss": 1.198, "step": 27788 }, { "epoch": 0.76, "learning_rate": 2.8967954482604164e-06, "loss": 1.2231, "step": 27789 }, { "epoch": 0.76, "learning_rate": 2.896172890507635e-06, "loss": 1.2957, "step": 27790 }, { "epoch": 0.76, "learning_rate": 2.8955503883318627e-06, "loss": 1.2866, "step": 27791 }, { "epoch": 0.76, "learning_rate": 2.894927941737957e-06, "loss": 1.1792, "step": 27792 }, { "epoch": 0.76, "learning_rate": 2.8943055507307938e-06, "loss": 1.1843, "step": 27793 }, { "epoch": 0.76, "learning_rate": 2.893683215315246e-06, "loss": 1.2026, "step": 27794 }, { "epoch": 0.76, "learning_rate": 2.8930609354961794e-06, "loss": 1.0911, "step": 27795 }, { "epoch": 0.76, "learning_rate": 2.892438711278461e-06, "loss": 1.3867, "step": 27796 }, { "epoch": 0.76, "learning_rate": 2.8918165426669585e-06, "loss": 1.2617, "step": 27797 }, { "epoch": 0.76, "learning_rate": 2.891194429666543e-06, "loss": 1.3296, "step": 27798 }, { "epoch": 0.76, "learning_rate": 2.89057237228208e-06, "loss": 1.3787, "step": 27799 }, { "epoch": 0.76, "learning_rate": 2.889950370518435e-06, "loss": 1.384, "step": 27800 }, { "epoch": 0.76, "learning_rate": 2.889328424380472e-06, "loss": 1.3113, "step": 27801 }, { "epoch": 0.76, "learning_rate": 2.8887065338730634e-06, "loss": 1.2832, "step": 27802 }, { "epoch": 0.76, "learning_rate": 2.8880846990010702e-06, "loss": 1.2644, "step": 27803 }, { "epoch": 0.76, "learning_rate": 2.887462919769358e-06, "loss": 1.2712, "step": 27804 }, { "epoch": 0.76, "learning_rate": 2.8868411961827893e-06, "loss": 1.2742, "step": 27805 }, { "epoch": 0.76, "learning_rate": 2.8862195282462326e-06, "loss": 1.1934, "step": 27806 }, { "epoch": 0.76, "learning_rate": 2.8855979159645487e-06, "loss": 1.3433, "step": 27807 }, { "epoch": 0.76, "learning_rate": 2.8849763593425984e-06, "loss": 1.3086, "step": 27808 }, { "epoch": 0.76, "learning_rate": 2.884354858385251e-06, "loss": 1.2812, "step": 27809 }, { "epoch": 0.76, "learning_rate": 2.8837334130973647e-06, "loss": 1.3977, "step": 27810 }, { "epoch": 0.76, "learning_rate": 2.883112023483803e-06, "loss": 1.1729, "step": 27811 }, { "epoch": 0.76, "learning_rate": 2.882490689549422e-06, "loss": 1.1985, "step": 27812 }, { "epoch": 0.76, "learning_rate": 2.88186941129909e-06, "loss": 1.3311, "step": 27813 }, { "epoch": 0.76, "learning_rate": 2.8812481887376644e-06, "loss": 1.3223, "step": 27814 }, { "epoch": 0.76, "learning_rate": 2.8806270218700063e-06, "loss": 1.313, "step": 27815 }, { "epoch": 0.76, "learning_rate": 2.8800059107009714e-06, "loss": 1.6069, "step": 27816 }, { "epoch": 0.76, "learning_rate": 2.879384855235424e-06, "loss": 1.2627, "step": 27817 }, { "epoch": 0.76, "learning_rate": 2.8787638554782227e-06, "loss": 1.2136, "step": 27818 }, { "epoch": 0.76, "learning_rate": 2.878142911434224e-06, "loss": 1.3147, "step": 27819 }, { "epoch": 0.76, "learning_rate": 2.8775220231082833e-06, "loss": 1.2905, "step": 27820 }, { "epoch": 0.76, "learning_rate": 2.8769011905052634e-06, "loss": 1.1836, "step": 27821 }, { "epoch": 0.76, "learning_rate": 2.876280413630019e-06, "loss": 1.0784, "step": 27822 }, { "epoch": 0.76, "learning_rate": 2.8756596924874045e-06, "loss": 1.3308, "step": 27823 }, { "epoch": 0.76, "learning_rate": 2.8750390270822814e-06, "loss": 1.2141, "step": 27824 }, { "epoch": 0.76, "learning_rate": 2.8744184174195e-06, "loss": 1.1753, "step": 27825 }, { "epoch": 0.76, "learning_rate": 2.873797863503923e-06, "loss": 1.2642, "step": 27826 }, { "epoch": 0.76, "learning_rate": 2.873177365340395e-06, "loss": 1.4316, "step": 27827 }, { "epoch": 0.76, "learning_rate": 2.87255692293378e-06, "loss": 1.2598, "step": 27828 }, { "epoch": 0.76, "learning_rate": 2.871936536288924e-06, "loss": 1.3877, "step": 27829 }, { "epoch": 0.76, "learning_rate": 2.8713162054106913e-06, "loss": 1.0483, "step": 27830 }, { "epoch": 0.76, "learning_rate": 2.8706959303039215e-06, "loss": 1.3328, "step": 27831 }, { "epoch": 0.76, "learning_rate": 2.8700757109734776e-06, "loss": 1.3911, "step": 27832 }, { "epoch": 0.76, "learning_rate": 2.869455547424207e-06, "loss": 1.2708, "step": 27833 }, { "epoch": 0.76, "learning_rate": 2.8688354396609676e-06, "loss": 1.1411, "step": 27834 }, { "epoch": 0.76, "learning_rate": 2.868215387688601e-06, "loss": 1.4092, "step": 27835 }, { "epoch": 0.76, "learning_rate": 2.867595391511967e-06, "loss": 1.3062, "step": 27836 }, { "epoch": 0.76, "learning_rate": 2.8669754511359092e-06, "loss": 1.2039, "step": 27837 }, { "epoch": 0.76, "learning_rate": 2.866355566565284e-06, "loss": 1.2578, "step": 27838 }, { "epoch": 0.76, "learning_rate": 2.8657357378049387e-06, "loss": 1.313, "step": 27839 }, { "epoch": 0.76, "learning_rate": 2.865115964859719e-06, "loss": 1.2095, "step": 27840 }, { "epoch": 0.76, "learning_rate": 2.864496247734481e-06, "loss": 1.3132, "step": 27841 }, { "epoch": 0.76, "learning_rate": 2.8638765864340677e-06, "loss": 1.1301, "step": 27842 }, { "epoch": 0.76, "learning_rate": 2.8632569809633293e-06, "loss": 1.0632, "step": 27843 }, { "epoch": 0.76, "learning_rate": 2.8626374313271087e-06, "loss": 1.1963, "step": 27844 }, { "epoch": 0.76, "learning_rate": 2.8620179375302604e-06, "loss": 1.261, "step": 27845 }, { "epoch": 0.76, "learning_rate": 2.861398499577627e-06, "loss": 1.3857, "step": 27846 }, { "epoch": 0.76, "learning_rate": 2.860779117474054e-06, "loss": 1.2256, "step": 27847 }, { "epoch": 0.76, "learning_rate": 2.8601597912243863e-06, "loss": 1.2451, "step": 27848 }, { "epoch": 0.76, "learning_rate": 2.8595405208334727e-06, "loss": 1.1863, "step": 27849 }, { "epoch": 0.76, "learning_rate": 2.8589213063061574e-06, "loss": 1.1956, "step": 27850 }, { "epoch": 0.76, "learning_rate": 2.858302147647284e-06, "loss": 1.3242, "step": 27851 }, { "epoch": 0.76, "learning_rate": 2.857683044861692e-06, "loss": 1.3237, "step": 27852 }, { "epoch": 0.76, "learning_rate": 2.8570639979542337e-06, "loss": 1.3447, "step": 27853 }, { "epoch": 0.76, "learning_rate": 2.856445006929747e-06, "loss": 1.2339, "step": 27854 }, { "epoch": 0.76, "learning_rate": 2.855826071793073e-06, "loss": 1.7466, "step": 27855 }, { "epoch": 0.76, "learning_rate": 2.8552071925490587e-06, "loss": 1.3206, "step": 27856 }, { "epoch": 0.76, "learning_rate": 2.8545883692025444e-06, "loss": 1.322, "step": 27857 }, { "epoch": 0.76, "learning_rate": 2.8539696017583696e-06, "loss": 1.1816, "step": 27858 }, { "epoch": 0.76, "learning_rate": 2.8533508902213746e-06, "loss": 1.3477, "step": 27859 }, { "epoch": 0.76, "learning_rate": 2.8527322345964036e-06, "loss": 1.1963, "step": 27860 }, { "epoch": 0.76, "learning_rate": 2.852113634888296e-06, "loss": 1.1621, "step": 27861 }, { "epoch": 0.76, "learning_rate": 2.851495091101889e-06, "loss": 1.2627, "step": 27862 }, { "epoch": 0.76, "learning_rate": 2.85087660324202e-06, "loss": 1.293, "step": 27863 }, { "epoch": 0.76, "learning_rate": 2.850258171313535e-06, "loss": 1.2949, "step": 27864 }, { "epoch": 0.76, "learning_rate": 2.8496397953212663e-06, "loss": 1.354, "step": 27865 }, { "epoch": 0.76, "learning_rate": 2.849021475270054e-06, "loss": 1.3105, "step": 27866 }, { "epoch": 0.76, "learning_rate": 2.848403211164733e-06, "loss": 1.3235, "step": 27867 }, { "epoch": 0.76, "learning_rate": 2.847785003010144e-06, "loss": 1.2754, "step": 27868 }, { "epoch": 0.76, "learning_rate": 2.847166850811123e-06, "loss": 1.1238, "step": 27869 }, { "epoch": 0.76, "learning_rate": 2.8465487545725013e-06, "loss": 1.2156, "step": 27870 }, { "epoch": 0.76, "learning_rate": 2.845930714299122e-06, "loss": 1.2866, "step": 27871 }, { "epoch": 0.76, "learning_rate": 2.8453127299958126e-06, "loss": 1.293, "step": 27872 }, { "epoch": 0.76, "learning_rate": 2.844694801667416e-06, "loss": 1.2542, "step": 27873 }, { "epoch": 0.76, "learning_rate": 2.844076929318763e-06, "loss": 1.4019, "step": 27874 }, { "epoch": 0.76, "learning_rate": 2.843459112954686e-06, "loss": 1.3179, "step": 27875 }, { "epoch": 0.76, "learning_rate": 2.842841352580018e-06, "loss": 1.2812, "step": 27876 }, { "epoch": 0.76, "learning_rate": 2.8422236481995956e-06, "loss": 1.1321, "step": 27877 }, { "epoch": 0.76, "learning_rate": 2.84160599981825e-06, "loss": 1.1111, "step": 27878 }, { "epoch": 0.76, "learning_rate": 2.8409884074408133e-06, "loss": 1.2581, "step": 27879 }, { "epoch": 0.76, "learning_rate": 2.8403708710721133e-06, "loss": 1.145, "step": 27880 }, { "epoch": 0.76, "learning_rate": 2.8397533907169884e-06, "loss": 1.3281, "step": 27881 }, { "epoch": 0.76, "learning_rate": 2.839135966380265e-06, "loss": 1.3362, "step": 27882 }, { "epoch": 0.76, "learning_rate": 2.838518598066775e-06, "loss": 1.3625, "step": 27883 }, { "epoch": 0.76, "learning_rate": 2.837901285781346e-06, "loss": 1.1011, "step": 27884 }, { "epoch": 0.76, "learning_rate": 2.8372840295288106e-06, "loss": 1.2405, "step": 27885 }, { "epoch": 0.76, "learning_rate": 2.8366668293139986e-06, "loss": 1.3877, "step": 27886 }, { "epoch": 0.76, "learning_rate": 2.836049685141733e-06, "loss": 1.2644, "step": 27887 }, { "epoch": 0.76, "learning_rate": 2.8354325970168483e-06, "loss": 1.364, "step": 27888 }, { "epoch": 0.76, "learning_rate": 2.834815564944171e-06, "loss": 1.2241, "step": 27889 }, { "epoch": 0.76, "learning_rate": 2.834198588928527e-06, "loss": 1.04, "step": 27890 }, { "epoch": 0.76, "learning_rate": 2.833581668974741e-06, "loss": 1.4536, "step": 27891 }, { "epoch": 0.76, "learning_rate": 2.8329648050876446e-06, "loss": 1.2305, "step": 27892 }, { "epoch": 0.76, "learning_rate": 2.8323479972720622e-06, "loss": 1.3518, "step": 27893 }, { "epoch": 0.76, "learning_rate": 2.831731245532818e-06, "loss": 1.3125, "step": 27894 }, { "epoch": 0.76, "learning_rate": 2.831114549874735e-06, "loss": 1.187, "step": 27895 }, { "epoch": 0.76, "learning_rate": 2.8304979103026433e-06, "loss": 1.4941, "step": 27896 }, { "epoch": 0.76, "learning_rate": 2.8298813268213645e-06, "loss": 1.22, "step": 27897 }, { "epoch": 0.76, "learning_rate": 2.8292647994357236e-06, "loss": 1.1953, "step": 27898 }, { "epoch": 0.76, "learning_rate": 2.8286483281505397e-06, "loss": 1.3904, "step": 27899 }, { "epoch": 0.76, "learning_rate": 2.8280319129706413e-06, "loss": 1.3035, "step": 27900 }, { "epoch": 0.76, "learning_rate": 2.8274155539008486e-06, "loss": 1.2781, "step": 27901 }, { "epoch": 0.76, "learning_rate": 2.826799250945982e-06, "loss": 1.1941, "step": 27902 }, { "epoch": 0.76, "learning_rate": 2.826183004110867e-06, "loss": 1.1187, "step": 27903 }, { "epoch": 0.76, "learning_rate": 2.82556681340032e-06, "loss": 1.3274, "step": 27904 }, { "epoch": 0.76, "learning_rate": 2.8249506788191703e-06, "loss": 1.3584, "step": 27905 }, { "epoch": 0.76, "learning_rate": 2.8243346003722273e-06, "loss": 1.2678, "step": 27906 }, { "epoch": 0.76, "learning_rate": 2.8237185780643195e-06, "loss": 1.199, "step": 27907 }, { "epoch": 0.76, "learning_rate": 2.823102611900259e-06, "loss": 1.0798, "step": 27908 }, { "epoch": 0.76, "learning_rate": 2.8224867018848746e-06, "loss": 1.6655, "step": 27909 }, { "epoch": 0.76, "learning_rate": 2.821870848022974e-06, "loss": 1.1694, "step": 27910 }, { "epoch": 0.76, "learning_rate": 2.8212550503193837e-06, "loss": 1.1711, "step": 27911 }, { "epoch": 0.76, "learning_rate": 2.820639308778914e-06, "loss": 1.2961, "step": 27912 }, { "epoch": 0.76, "learning_rate": 2.8200236234063936e-06, "loss": 1.1428, "step": 27913 }, { "epoch": 0.76, "learning_rate": 2.8194079942066253e-06, "loss": 1.6855, "step": 27914 }, { "epoch": 0.76, "learning_rate": 2.8187924211844363e-06, "loss": 1.2107, "step": 27915 }, { "epoch": 0.76, "learning_rate": 2.818176904344634e-06, "loss": 1.2461, "step": 27916 }, { "epoch": 0.76, "learning_rate": 2.8175614436920428e-06, "loss": 1.1853, "step": 27917 }, { "epoch": 0.76, "learning_rate": 2.816946039231473e-06, "loss": 1.2822, "step": 27918 }, { "epoch": 0.76, "learning_rate": 2.8163306909677366e-06, "loss": 1.302, "step": 27919 }, { "epoch": 0.76, "learning_rate": 2.815715398905654e-06, "loss": 1.3325, "step": 27920 }, { "epoch": 0.76, "learning_rate": 2.8151001630500353e-06, "loss": 1.2834, "step": 27921 }, { "epoch": 0.76, "learning_rate": 2.8144849834056955e-06, "loss": 1.2915, "step": 27922 }, { "epoch": 0.76, "learning_rate": 2.813869859977443e-06, "loss": 1.2776, "step": 27923 }, { "epoch": 0.76, "learning_rate": 2.813254792770096e-06, "loss": 1.252, "step": 27924 }, { "epoch": 0.76, "learning_rate": 2.812639781788464e-06, "loss": 1.4563, "step": 27925 }, { "epoch": 0.76, "learning_rate": 2.8120248270373583e-06, "loss": 1.3359, "step": 27926 }, { "epoch": 0.76, "learning_rate": 2.811409928521588e-06, "loss": 1.3406, "step": 27927 }, { "epoch": 0.76, "learning_rate": 2.81079508624597e-06, "loss": 1.2534, "step": 27928 }, { "epoch": 0.76, "learning_rate": 2.8101803002153093e-06, "loss": 1.4363, "step": 27929 }, { "epoch": 0.76, "learning_rate": 2.809565570434417e-06, "loss": 1.2146, "step": 27930 }, { "epoch": 0.76, "learning_rate": 2.8089508969081e-06, "loss": 1.3147, "step": 27931 }, { "epoch": 0.76, "learning_rate": 2.808336279641173e-06, "loss": 1.3999, "step": 27932 }, { "epoch": 0.76, "learning_rate": 2.807721718638441e-06, "loss": 1.2952, "step": 27933 }, { "epoch": 0.76, "learning_rate": 2.8071072139047083e-06, "loss": 1.3706, "step": 27934 }, { "epoch": 0.76, "learning_rate": 2.8064927654447906e-06, "loss": 1.2007, "step": 27935 }, { "epoch": 0.76, "learning_rate": 2.80587837326349e-06, "loss": 1.1392, "step": 27936 }, { "epoch": 0.76, "learning_rate": 2.805264037365615e-06, "loss": 1.2249, "step": 27937 }, { "epoch": 0.76, "learning_rate": 2.8046497577559674e-06, "loss": 1.2175, "step": 27938 }, { "epoch": 0.76, "learning_rate": 2.80403553443936e-06, "loss": 1.301, "step": 27939 }, { "epoch": 0.76, "learning_rate": 2.8034213674205936e-06, "loss": 1.1873, "step": 27940 }, { "epoch": 0.76, "learning_rate": 2.802807256704475e-06, "loss": 1.3789, "step": 27941 }, { "epoch": 0.76, "learning_rate": 2.8021932022958052e-06, "loss": 1.3669, "step": 27942 }, { "epoch": 0.76, "learning_rate": 2.801579204199395e-06, "loss": 1.264, "step": 27943 }, { "epoch": 0.76, "learning_rate": 2.8009652624200436e-06, "loss": 1.2878, "step": 27944 }, { "epoch": 0.76, "learning_rate": 2.8003513769625544e-06, "loss": 1.1489, "step": 27945 }, { "epoch": 0.76, "learning_rate": 2.799737547831728e-06, "loss": 1.6729, "step": 27946 }, { "epoch": 0.76, "learning_rate": 2.7991237750323685e-06, "loss": 1.2876, "step": 27947 }, { "epoch": 0.76, "learning_rate": 2.7985100585692847e-06, "loss": 1.1057, "step": 27948 }, { "epoch": 0.76, "learning_rate": 2.797896398447266e-06, "loss": 1.1278, "step": 27949 }, { "epoch": 0.76, "learning_rate": 2.7972827946711224e-06, "loss": 1.1335, "step": 27950 }, { "epoch": 0.76, "learning_rate": 2.7966692472456482e-06, "loss": 1.4856, "step": 27951 }, { "epoch": 0.76, "learning_rate": 2.796055756175653e-06, "loss": 1.0427, "step": 27952 }, { "epoch": 0.76, "learning_rate": 2.7954423214659232e-06, "loss": 1.1572, "step": 27953 }, { "epoch": 0.76, "learning_rate": 2.7948289431212684e-06, "loss": 1.4446, "step": 27954 }, { "epoch": 0.76, "learning_rate": 2.79421562114648e-06, "loss": 1.0179, "step": 27955 }, { "epoch": 0.76, "learning_rate": 2.7936023555463663e-06, "loss": 1.2649, "step": 27956 }, { "epoch": 0.76, "learning_rate": 2.7929891463257142e-06, "loss": 1.2341, "step": 27957 }, { "epoch": 0.76, "learning_rate": 2.792375993489328e-06, "loss": 1.1008, "step": 27958 }, { "epoch": 0.76, "learning_rate": 2.7917628970420006e-06, "loss": 1.3989, "step": 27959 }, { "epoch": 0.76, "learning_rate": 2.7911498569885364e-06, "loss": 1.2739, "step": 27960 }, { "epoch": 0.76, "learning_rate": 2.79053687333372e-06, "loss": 1.2446, "step": 27961 }, { "epoch": 0.76, "learning_rate": 2.7899239460823557e-06, "loss": 1.2671, "step": 27962 }, { "epoch": 0.76, "learning_rate": 2.7893110752392328e-06, "loss": 1.2476, "step": 27963 }, { "epoch": 0.76, "learning_rate": 2.788698260809153e-06, "loss": 1.3127, "step": 27964 }, { "epoch": 0.76, "learning_rate": 2.7880855027969066e-06, "loss": 1.1091, "step": 27965 }, { "epoch": 0.76, "learning_rate": 2.787472801207285e-06, "loss": 1.1956, "step": 27966 }, { "epoch": 0.76, "learning_rate": 2.786860156045087e-06, "loss": 1.1948, "step": 27967 }, { "epoch": 0.76, "learning_rate": 2.7862475673151047e-06, "loss": 1.1963, "step": 27968 }, { "epoch": 0.76, "learning_rate": 2.7856350350221285e-06, "loss": 1.2429, "step": 27969 }, { "epoch": 0.76, "learning_rate": 2.785022559170948e-06, "loss": 1.3767, "step": 27970 }, { "epoch": 0.76, "learning_rate": 2.7844101397663615e-06, "loss": 1.2773, "step": 27971 }, { "epoch": 0.76, "learning_rate": 2.7837977768131575e-06, "loss": 1.2893, "step": 27972 }, { "epoch": 0.76, "learning_rate": 2.7831854703161253e-06, "loss": 1.3447, "step": 27973 }, { "epoch": 0.76, "learning_rate": 2.782573220280055e-06, "loss": 1.2866, "step": 27974 }, { "epoch": 0.76, "learning_rate": 2.7819610267097396e-06, "loss": 1.3247, "step": 27975 }, { "epoch": 0.76, "learning_rate": 2.7813488896099672e-06, "loss": 1.3401, "step": 27976 }, { "epoch": 0.76, "learning_rate": 2.780736808985528e-06, "loss": 1.1509, "step": 27977 }, { "epoch": 0.76, "learning_rate": 2.780124784841205e-06, "loss": 1.123, "step": 27978 }, { "epoch": 0.76, "learning_rate": 2.7795128171817932e-06, "loss": 1.199, "step": 27979 }, { "epoch": 0.76, "learning_rate": 2.7789009060120786e-06, "loss": 1.2371, "step": 27980 }, { "epoch": 0.76, "learning_rate": 2.778289051336844e-06, "loss": 1.3604, "step": 27981 }, { "epoch": 0.76, "learning_rate": 2.7776772531608842e-06, "loss": 1.2109, "step": 27982 }, { "epoch": 0.76, "learning_rate": 2.777065511488981e-06, "loss": 1.6821, "step": 27983 }, { "epoch": 0.76, "learning_rate": 2.77645382632592e-06, "loss": 1.1885, "step": 27984 }, { "epoch": 0.76, "learning_rate": 2.775842197676486e-06, "loss": 1.406, "step": 27985 }, { "epoch": 0.76, "learning_rate": 2.7752306255454673e-06, "loss": 1.2542, "step": 27986 }, { "epoch": 0.76, "learning_rate": 2.7746191099376475e-06, "loss": 1.1702, "step": 27987 }, { "epoch": 0.76, "learning_rate": 2.7740076508578094e-06, "loss": 1.241, "step": 27988 }, { "epoch": 0.76, "learning_rate": 2.773396248310735e-06, "loss": 1.1921, "step": 27989 }, { "epoch": 0.76, "learning_rate": 2.7727849023012134e-06, "loss": 1.4253, "step": 27990 }, { "epoch": 0.76, "learning_rate": 2.7721736128340237e-06, "loss": 1.2253, "step": 27991 }, { "epoch": 0.76, "learning_rate": 2.7715623799139493e-06, "loss": 1.1323, "step": 27992 }, { "epoch": 0.76, "learning_rate": 2.7709512035457687e-06, "loss": 1.3953, "step": 27993 }, { "epoch": 0.76, "learning_rate": 2.7703400837342664e-06, "loss": 1.21, "step": 27994 }, { "epoch": 0.76, "learning_rate": 2.76972902048423e-06, "loss": 1.1492, "step": 27995 }, { "epoch": 0.76, "learning_rate": 2.7691180138004282e-06, "loss": 1.1047, "step": 27996 }, { "epoch": 0.76, "learning_rate": 2.7685070636876486e-06, "loss": 1.2019, "step": 27997 }, { "epoch": 0.76, "learning_rate": 2.767896170150667e-06, "loss": 1.3706, "step": 27998 }, { "epoch": 0.76, "learning_rate": 2.767285333194272e-06, "loss": 1.2253, "step": 27999 }, { "epoch": 0.76, "learning_rate": 2.7666745528232276e-06, "loss": 1.3083, "step": 28000 }, { "epoch": 0.76, "learning_rate": 2.7660638290423237e-06, "loss": 1.1663, "step": 28001 }, { "epoch": 0.76, "learning_rate": 2.765453161856333e-06, "loss": 1.3542, "step": 28002 }, { "epoch": 0.76, "learning_rate": 2.7648425512700393e-06, "loss": 1.2058, "step": 28003 }, { "epoch": 0.76, "learning_rate": 2.7642319972882102e-06, "loss": 1.4927, "step": 28004 }, { "epoch": 0.76, "learning_rate": 2.7636214999156298e-06, "loss": 1.3767, "step": 28005 }, { "epoch": 0.76, "learning_rate": 2.763011059157069e-06, "loss": 1.1689, "step": 28006 }, { "epoch": 0.76, "learning_rate": 2.762400675017314e-06, "loss": 1.2141, "step": 28007 }, { "epoch": 0.76, "learning_rate": 2.7617903475011252e-06, "loss": 1.196, "step": 28008 }, { "epoch": 0.76, "learning_rate": 2.761180076613286e-06, "loss": 1.342, "step": 28009 }, { "epoch": 0.76, "learning_rate": 2.760569862358572e-06, "loss": 1.2998, "step": 28010 }, { "epoch": 0.76, "learning_rate": 2.759959704741756e-06, "loss": 1.2776, "step": 28011 }, { "epoch": 0.76, "learning_rate": 2.7593496037676105e-06, "loss": 1.3823, "step": 28012 }, { "epoch": 0.77, "learning_rate": 2.758739559440905e-06, "loss": 1.2595, "step": 28013 }, { "epoch": 0.77, "learning_rate": 2.75812957176642e-06, "loss": 1.2056, "step": 28014 }, { "epoch": 0.77, "learning_rate": 2.7575196407489245e-06, "loss": 1.3633, "step": 28015 }, { "epoch": 0.77, "learning_rate": 2.7569097663931888e-06, "loss": 1.189, "step": 28016 }, { "epoch": 0.77, "learning_rate": 2.7562999487039822e-06, "loss": 1.23, "step": 28017 }, { "epoch": 0.77, "learning_rate": 2.755690187686082e-06, "loss": 1.1489, "step": 28018 }, { "epoch": 0.77, "learning_rate": 2.7550804833442547e-06, "loss": 1.2036, "step": 28019 }, { "epoch": 0.77, "learning_rate": 2.7544708356832717e-06, "loss": 1.3643, "step": 28020 }, { "epoch": 0.77, "learning_rate": 2.753861244707898e-06, "loss": 1.1506, "step": 28021 }, { "epoch": 0.77, "learning_rate": 2.7532517104229095e-06, "loss": 1.1973, "step": 28022 }, { "epoch": 0.77, "learning_rate": 2.7526422328330726e-06, "loss": 1.3335, "step": 28023 }, { "epoch": 0.77, "learning_rate": 2.752032811943155e-06, "loss": 1.2424, "step": 28024 }, { "epoch": 0.77, "learning_rate": 2.7514234477579205e-06, "loss": 1.3589, "step": 28025 }, { "epoch": 0.77, "learning_rate": 2.750814140282144e-06, "loss": 1.1606, "step": 28026 }, { "epoch": 0.77, "learning_rate": 2.750204889520589e-06, "loss": 1.301, "step": 28027 }, { "epoch": 0.77, "learning_rate": 2.749595695478019e-06, "loss": 1.2561, "step": 28028 }, { "epoch": 0.77, "learning_rate": 2.7489865581592045e-06, "loss": 1.2598, "step": 28029 }, { "epoch": 0.77, "learning_rate": 2.748377477568911e-06, "loss": 1.1709, "step": 28030 }, { "epoch": 0.77, "learning_rate": 2.747768453711902e-06, "loss": 1.2209, "step": 28031 }, { "epoch": 0.77, "learning_rate": 2.7471594865929387e-06, "loss": 1.2754, "step": 28032 }, { "epoch": 0.77, "learning_rate": 2.7465505762167934e-06, "loss": 1.376, "step": 28033 }, { "epoch": 0.77, "learning_rate": 2.7459417225882248e-06, "loss": 1.2771, "step": 28034 }, { "epoch": 0.77, "learning_rate": 2.7453329257119965e-06, "loss": 1.1564, "step": 28035 }, { "epoch": 0.77, "learning_rate": 2.7447241855928686e-06, "loss": 1.2454, "step": 28036 }, { "epoch": 0.77, "learning_rate": 2.7441155022356113e-06, "loss": 1.259, "step": 28037 }, { "epoch": 0.77, "learning_rate": 2.7435068756449823e-06, "loss": 1.3691, "step": 28038 }, { "epoch": 0.77, "learning_rate": 2.742898305825743e-06, "loss": 1.2043, "step": 28039 }, { "epoch": 0.77, "learning_rate": 2.742289792782651e-06, "loss": 1.3279, "step": 28040 }, { "epoch": 0.77, "learning_rate": 2.741681336520472e-06, "loss": 1.3108, "step": 28041 }, { "epoch": 0.77, "learning_rate": 2.74107293704397e-06, "loss": 1.3455, "step": 28042 }, { "epoch": 0.77, "learning_rate": 2.7404645943578947e-06, "loss": 1.2104, "step": 28043 }, { "epoch": 0.77, "learning_rate": 2.739856308467014e-06, "loss": 1.2041, "step": 28044 }, { "epoch": 0.77, "learning_rate": 2.73924807937608e-06, "loss": 1.2039, "step": 28045 }, { "epoch": 0.77, "learning_rate": 2.7386399070898604e-06, "loss": 1.4224, "step": 28046 }, { "epoch": 0.77, "learning_rate": 2.738031791613103e-06, "loss": 1.2861, "step": 28047 }, { "epoch": 0.77, "learning_rate": 2.7374237329505725e-06, "loss": 1.1951, "step": 28048 }, { "epoch": 0.77, "learning_rate": 2.73681573110702e-06, "loss": 1.2915, "step": 28049 }, { "epoch": 0.77, "learning_rate": 2.736207786087213e-06, "loss": 1.342, "step": 28050 }, { "epoch": 0.77, "learning_rate": 2.7355998978958933e-06, "loss": 1.2571, "step": 28051 }, { "epoch": 0.77, "learning_rate": 2.7349920665378273e-06, "loss": 1.3452, "step": 28052 }, { "epoch": 0.77, "learning_rate": 2.734384292017764e-06, "loss": 1.3108, "step": 28053 }, { "epoch": 0.77, "learning_rate": 2.7337765743404686e-06, "loss": 1.355, "step": 28054 }, { "epoch": 0.77, "learning_rate": 2.733168913510681e-06, "loss": 1.1375, "step": 28055 }, { "epoch": 0.77, "learning_rate": 2.7325613095331637e-06, "loss": 1.2307, "step": 28056 }, { "epoch": 0.77, "learning_rate": 2.7319537624126724e-06, "loss": 1.3167, "step": 28057 }, { "epoch": 0.77, "learning_rate": 2.7313462721539564e-06, "loss": 1.3359, "step": 28058 }, { "epoch": 0.77, "learning_rate": 2.7307388387617694e-06, "loss": 1.272, "step": 28059 }, { "epoch": 0.77, "learning_rate": 2.7301314622408613e-06, "loss": 1.4382, "step": 28060 }, { "epoch": 0.77, "learning_rate": 2.7295241425959885e-06, "loss": 1.196, "step": 28061 }, { "epoch": 0.77, "learning_rate": 2.7289168798319e-06, "loss": 1.4102, "step": 28062 }, { "epoch": 0.77, "learning_rate": 2.7283096739533466e-06, "loss": 1.2861, "step": 28063 }, { "epoch": 0.77, "learning_rate": 2.727702524965076e-06, "loss": 1.324, "step": 28064 }, { "epoch": 0.77, "learning_rate": 2.7270954328718447e-06, "loss": 1.3779, "step": 28065 }, { "epoch": 0.77, "learning_rate": 2.7264883976783987e-06, "loss": 1.4229, "step": 28066 }, { "epoch": 0.77, "learning_rate": 2.7258814193894866e-06, "loss": 1.2522, "step": 28067 }, { "epoch": 0.77, "learning_rate": 2.7252744980098544e-06, "loss": 1.3535, "step": 28068 }, { "epoch": 0.77, "learning_rate": 2.7246676335442578e-06, "loss": 1.1743, "step": 28069 }, { "epoch": 0.77, "learning_rate": 2.7240608259974397e-06, "loss": 1.1768, "step": 28070 }, { "epoch": 0.77, "learning_rate": 2.7234540753741457e-06, "loss": 1.272, "step": 28071 }, { "epoch": 0.77, "learning_rate": 2.722847381679128e-06, "loss": 1.3303, "step": 28072 }, { "epoch": 0.77, "learning_rate": 2.722240744917131e-06, "loss": 1.1135, "step": 28073 }, { "epoch": 0.77, "learning_rate": 2.7216341650929e-06, "loss": 1.2854, "step": 28074 }, { "epoch": 0.77, "learning_rate": 2.721027642211178e-06, "loss": 1.241, "step": 28075 }, { "epoch": 0.77, "learning_rate": 2.720421176276715e-06, "loss": 1.709, "step": 28076 }, { "epoch": 0.77, "learning_rate": 2.7198147672942543e-06, "loss": 1.3748, "step": 28077 }, { "epoch": 0.77, "learning_rate": 2.7192084152685394e-06, "loss": 1.1702, "step": 28078 }, { "epoch": 0.77, "learning_rate": 2.7186021202043113e-06, "loss": 1.2686, "step": 28079 }, { "epoch": 0.77, "learning_rate": 2.717995882106319e-06, "loss": 1.1836, "step": 28080 }, { "epoch": 0.77, "learning_rate": 2.7173897009793026e-06, "loss": 1.3389, "step": 28081 }, { "epoch": 0.77, "learning_rate": 2.716783576828005e-06, "loss": 1.2351, "step": 28082 }, { "epoch": 0.77, "learning_rate": 2.7161775096571654e-06, "loss": 1.1276, "step": 28083 }, { "epoch": 0.77, "learning_rate": 2.71557149947153e-06, "loss": 1.1721, "step": 28084 }, { "epoch": 0.77, "learning_rate": 2.714965546275837e-06, "loss": 1.5115, "step": 28085 }, { "epoch": 0.77, "learning_rate": 2.714359650074829e-06, "loss": 1.3933, "step": 28086 }, { "epoch": 0.77, "learning_rate": 2.7137538108732432e-06, "loss": 1.2917, "step": 28087 }, { "epoch": 0.77, "learning_rate": 2.7131480286758193e-06, "loss": 1.3511, "step": 28088 }, { "epoch": 0.77, "learning_rate": 2.7125423034873054e-06, "loss": 1.2041, "step": 28089 }, { "epoch": 0.77, "learning_rate": 2.7119366353124288e-06, "loss": 1.3311, "step": 28090 }, { "epoch": 0.77, "learning_rate": 2.711331024155934e-06, "loss": 1.2996, "step": 28091 }, { "epoch": 0.77, "learning_rate": 2.710725470022556e-06, "loss": 1.1521, "step": 28092 }, { "epoch": 0.77, "learning_rate": 2.7101199729170404e-06, "loss": 1.4192, "step": 28093 }, { "epoch": 0.77, "learning_rate": 2.709514532844112e-06, "loss": 1.1243, "step": 28094 }, { "epoch": 0.77, "learning_rate": 2.7089091498085176e-06, "loss": 1.2153, "step": 28095 }, { "epoch": 0.77, "learning_rate": 2.708303823814985e-06, "loss": 1.1714, "step": 28096 }, { "epoch": 0.77, "learning_rate": 2.7076985548682613e-06, "loss": 1.1208, "step": 28097 }, { "epoch": 0.77, "learning_rate": 2.7070933429730686e-06, "loss": 1.2411, "step": 28098 }, { "epoch": 0.77, "learning_rate": 2.7064881881341507e-06, "loss": 1.2185, "step": 28099 }, { "epoch": 0.77, "learning_rate": 2.705883090356237e-06, "loss": 1.2368, "step": 28100 }, { "epoch": 0.77, "learning_rate": 2.705278049644068e-06, "loss": 1.2202, "step": 28101 }, { "epoch": 0.77, "learning_rate": 2.704673066002372e-06, "loss": 1.4163, "step": 28102 }, { "epoch": 0.77, "learning_rate": 2.7040681394358813e-06, "loss": 1.0437, "step": 28103 }, { "epoch": 0.77, "learning_rate": 2.7034632699493334e-06, "loss": 1.2092, "step": 28104 }, { "epoch": 0.77, "learning_rate": 2.702858457547458e-06, "loss": 1.3354, "step": 28105 }, { "epoch": 0.77, "learning_rate": 2.702253702234986e-06, "loss": 1.2668, "step": 28106 }, { "epoch": 0.77, "learning_rate": 2.7016490040166476e-06, "loss": 1.2998, "step": 28107 }, { "epoch": 0.77, "learning_rate": 2.701044362897177e-06, "loss": 1.3223, "step": 28108 }, { "epoch": 0.77, "learning_rate": 2.700439778881304e-06, "loss": 1.2842, "step": 28109 }, { "epoch": 0.77, "learning_rate": 2.699835251973758e-06, "loss": 1.2642, "step": 28110 }, { "epoch": 0.77, "learning_rate": 2.699230782179264e-06, "loss": 1.1016, "step": 28111 }, { "epoch": 0.77, "learning_rate": 2.6986263695025596e-06, "loss": 1.1885, "step": 28112 }, { "epoch": 0.77, "learning_rate": 2.698022013948368e-06, "loss": 1.384, "step": 28113 }, { "epoch": 0.77, "learning_rate": 2.6974177155214197e-06, "loss": 1.2234, "step": 28114 }, { "epoch": 0.77, "learning_rate": 2.6968134742264374e-06, "loss": 1.2551, "step": 28115 }, { "epoch": 0.77, "learning_rate": 2.696209290068156e-06, "loss": 1.2336, "step": 28116 }, { "epoch": 0.77, "learning_rate": 2.695605163051298e-06, "loss": 1.283, "step": 28117 }, { "epoch": 0.77, "learning_rate": 2.695001093180588e-06, "loss": 1.2542, "step": 28118 }, { "epoch": 0.77, "learning_rate": 2.6943970804607567e-06, "loss": 1.1095, "step": 28119 }, { "epoch": 0.77, "learning_rate": 2.6937931248965276e-06, "loss": 1.1904, "step": 28120 }, { "epoch": 0.77, "learning_rate": 2.693189226492625e-06, "loss": 1.3379, "step": 28121 }, { "epoch": 0.77, "learning_rate": 2.692585385253772e-06, "loss": 1.2839, "step": 28122 }, { "epoch": 0.77, "learning_rate": 2.691981601184698e-06, "loss": 1.3301, "step": 28123 }, { "epoch": 0.77, "learning_rate": 2.691377874290122e-06, "loss": 1.1279, "step": 28124 }, { "epoch": 0.77, "learning_rate": 2.6907742045747696e-06, "loss": 1.166, "step": 28125 }, { "epoch": 0.77, "learning_rate": 2.6901705920433598e-06, "loss": 1.1748, "step": 28126 }, { "epoch": 0.77, "learning_rate": 2.689567036700621e-06, "loss": 1.2476, "step": 28127 }, { "epoch": 0.77, "learning_rate": 2.688963538551271e-06, "loss": 1.3391, "step": 28128 }, { "epoch": 0.77, "learning_rate": 2.6883600976000334e-06, "loss": 1.1094, "step": 28129 }, { "epoch": 0.77, "learning_rate": 2.687756713851626e-06, "loss": 1.2273, "step": 28130 }, { "epoch": 0.77, "learning_rate": 2.6871533873107737e-06, "loss": 1.1846, "step": 28131 }, { "epoch": 0.77, "learning_rate": 2.686550117982194e-06, "loss": 1.2139, "step": 28132 }, { "epoch": 0.77, "learning_rate": 2.6859469058706078e-06, "loss": 1.7915, "step": 28133 }, { "epoch": 0.77, "learning_rate": 2.685343750980731e-06, "loss": 1.186, "step": 28134 }, { "epoch": 0.77, "learning_rate": 2.684740653317285e-06, "loss": 1.2373, "step": 28135 }, { "epoch": 0.77, "learning_rate": 2.6841376128849905e-06, "loss": 1.2146, "step": 28136 }, { "epoch": 0.77, "learning_rate": 2.683534629688563e-06, "loss": 1.3386, "step": 28137 }, { "epoch": 0.77, "learning_rate": 2.6829317037327217e-06, "loss": 1.3367, "step": 28138 }, { "epoch": 0.77, "learning_rate": 2.6823288350221777e-06, "loss": 1.2849, "step": 28139 }, { "epoch": 0.77, "learning_rate": 2.681726023561655e-06, "loss": 1.3491, "step": 28140 }, { "epoch": 0.77, "learning_rate": 2.6811232693558674e-06, "loss": 1.291, "step": 28141 }, { "epoch": 0.77, "learning_rate": 2.6805205724095295e-06, "loss": 1.0618, "step": 28142 }, { "epoch": 0.77, "learning_rate": 2.679917932727353e-06, "loss": 1.1558, "step": 28143 }, { "epoch": 0.77, "learning_rate": 2.6793153503140602e-06, "loss": 1.3567, "step": 28144 }, { "epoch": 0.77, "learning_rate": 2.678712825174361e-06, "loss": 1.1497, "step": 28145 }, { "epoch": 0.77, "learning_rate": 2.6781103573129706e-06, "loss": 1.2375, "step": 28146 }, { "epoch": 0.77, "learning_rate": 2.6775079467345987e-06, "loss": 1.2761, "step": 28147 }, { "epoch": 0.77, "learning_rate": 2.6769055934439634e-06, "loss": 1.3389, "step": 28148 }, { "epoch": 0.77, "learning_rate": 2.676303297445777e-06, "loss": 1.416, "step": 28149 }, { "epoch": 0.77, "learning_rate": 2.675701058744745e-06, "loss": 1.2031, "step": 28150 }, { "epoch": 0.77, "learning_rate": 2.675098877345588e-06, "loss": 1.2266, "step": 28151 }, { "epoch": 0.77, "learning_rate": 2.674496753253012e-06, "loss": 1.3176, "step": 28152 }, { "epoch": 0.77, "learning_rate": 2.6738946864717295e-06, "loss": 1.3015, "step": 28153 }, { "epoch": 0.77, "learning_rate": 2.673292677006447e-06, "loss": 1.198, "step": 28154 }, { "epoch": 0.77, "learning_rate": 2.6726907248618794e-06, "loss": 1.3025, "step": 28155 }, { "epoch": 0.77, "learning_rate": 2.672088830042735e-06, "loss": 1.3506, "step": 28156 }, { "epoch": 0.77, "learning_rate": 2.671486992553721e-06, "loss": 1.2878, "step": 28157 }, { "epoch": 0.77, "learning_rate": 2.6708852123995444e-06, "loss": 1.2261, "step": 28158 }, { "epoch": 0.77, "learning_rate": 2.6702834895849184e-06, "loss": 1.7227, "step": 28159 }, { "epoch": 0.77, "learning_rate": 2.6696818241145474e-06, "loss": 1.0874, "step": 28160 }, { "epoch": 0.77, "learning_rate": 2.6690802159931397e-06, "loss": 1.3115, "step": 28161 }, { "epoch": 0.77, "learning_rate": 2.6684786652253967e-06, "loss": 1.2996, "step": 28162 }, { "epoch": 0.77, "learning_rate": 2.667877171816032e-06, "loss": 1.1575, "step": 28163 }, { "epoch": 0.77, "learning_rate": 2.6672757357697497e-06, "loss": 1.2249, "step": 28164 }, { "epoch": 0.77, "learning_rate": 2.666674357091251e-06, "loss": 1.3191, "step": 28165 }, { "epoch": 0.77, "learning_rate": 2.666073035785246e-06, "loss": 1.2327, "step": 28166 }, { "epoch": 0.77, "learning_rate": 2.665471771856435e-06, "loss": 1.354, "step": 28167 }, { "epoch": 0.77, "learning_rate": 2.6648705653095287e-06, "loss": 1.3, "step": 28168 }, { "epoch": 0.77, "learning_rate": 2.66426941614922e-06, "loss": 1.1628, "step": 28169 }, { "epoch": 0.77, "learning_rate": 2.6636683243802207e-06, "loss": 1.2458, "step": 28170 }, { "epoch": 0.77, "learning_rate": 2.6630672900072287e-06, "loss": 1.2896, "step": 28171 }, { "epoch": 0.77, "learning_rate": 2.6624663130349537e-06, "loss": 1.3489, "step": 28172 }, { "epoch": 0.77, "learning_rate": 2.661865393468086e-06, "loss": 1.2351, "step": 28173 }, { "epoch": 0.77, "learning_rate": 2.661264531311335e-06, "loss": 1.1304, "step": 28174 }, { "epoch": 0.77, "learning_rate": 2.660663726569398e-06, "loss": 1.3989, "step": 28175 }, { "epoch": 0.77, "learning_rate": 2.660062979246981e-06, "loss": 1.2007, "step": 28176 }, { "epoch": 0.77, "learning_rate": 2.6594622893487756e-06, "loss": 1.1599, "step": 28177 }, { "epoch": 0.77, "learning_rate": 2.658861656879487e-06, "loss": 1.2235, "step": 28178 }, { "epoch": 0.77, "learning_rate": 2.65826108184381e-06, "loss": 1.178, "step": 28179 }, { "epoch": 0.77, "learning_rate": 2.6576605642464494e-06, "loss": 1.3491, "step": 28180 }, { "epoch": 0.77, "learning_rate": 2.6570601040920996e-06, "loss": 1.1667, "step": 28181 }, { "epoch": 0.77, "learning_rate": 2.656459701385455e-06, "loss": 1.1887, "step": 28182 }, { "epoch": 0.77, "learning_rate": 2.655859356131221e-06, "loss": 1.2966, "step": 28183 }, { "epoch": 0.77, "learning_rate": 2.6552590683340897e-06, "loss": 1.2649, "step": 28184 }, { "epoch": 0.77, "learning_rate": 2.654658837998757e-06, "loss": 1.1152, "step": 28185 }, { "epoch": 0.77, "learning_rate": 2.654058665129917e-06, "loss": 1.2969, "step": 28186 }, { "epoch": 0.77, "learning_rate": 2.6534585497322705e-06, "loss": 1.2422, "step": 28187 }, { "epoch": 0.77, "learning_rate": 2.6528584918105092e-06, "loss": 1.2571, "step": 28188 }, { "epoch": 0.77, "learning_rate": 2.6522584913693295e-06, "loss": 1.4585, "step": 28189 }, { "epoch": 0.77, "learning_rate": 2.6516585484134194e-06, "loss": 1.2266, "step": 28190 }, { "epoch": 0.77, "learning_rate": 2.6510586629474823e-06, "loss": 1.7183, "step": 28191 }, { "epoch": 0.77, "learning_rate": 2.650458834976205e-06, "loss": 1.2039, "step": 28192 }, { "epoch": 0.77, "learning_rate": 2.649859064504282e-06, "loss": 1.1929, "step": 28193 }, { "epoch": 0.77, "learning_rate": 2.649259351536403e-06, "loss": 1.2024, "step": 28194 }, { "epoch": 0.77, "learning_rate": 2.648659696077266e-06, "loss": 1.2097, "step": 28195 }, { "epoch": 0.77, "learning_rate": 2.6480600981315573e-06, "loss": 1.2883, "step": 28196 }, { "epoch": 0.77, "learning_rate": 2.647460557703967e-06, "loss": 1.2751, "step": 28197 }, { "epoch": 0.77, "learning_rate": 2.646861074799191e-06, "loss": 1.4702, "step": 28198 }, { "epoch": 0.77, "learning_rate": 2.6462616494219152e-06, "loss": 1.2715, "step": 28199 }, { "epoch": 0.77, "learning_rate": 2.6456622815768305e-06, "loss": 1.0745, "step": 28200 }, { "epoch": 0.77, "learning_rate": 2.6450629712686237e-06, "loss": 1.2927, "step": 28201 }, { "epoch": 0.77, "learning_rate": 2.6444637185019883e-06, "loss": 1.2029, "step": 28202 }, { "epoch": 0.77, "learning_rate": 2.6438645232816096e-06, "loss": 1.0742, "step": 28203 }, { "epoch": 0.77, "learning_rate": 2.643265385612176e-06, "loss": 1.0333, "step": 28204 }, { "epoch": 0.77, "learning_rate": 2.6426663054983724e-06, "loss": 1.2264, "step": 28205 }, { "epoch": 0.77, "learning_rate": 2.64206728294489e-06, "loss": 1.1011, "step": 28206 }, { "epoch": 0.77, "learning_rate": 2.641468317956414e-06, "loss": 1.2458, "step": 28207 }, { "epoch": 0.77, "learning_rate": 2.6408694105376285e-06, "loss": 1.3149, "step": 28208 }, { "epoch": 0.77, "learning_rate": 2.640270560693219e-06, "loss": 1.1382, "step": 28209 }, { "epoch": 0.77, "learning_rate": 2.6396717684278727e-06, "loss": 1.3246, "step": 28210 }, { "epoch": 0.77, "learning_rate": 2.6390730337462743e-06, "loss": 1.2646, "step": 28211 }, { "epoch": 0.77, "learning_rate": 2.6384743566531047e-06, "loss": 1.291, "step": 28212 }, { "epoch": 0.77, "learning_rate": 2.6378757371530527e-06, "loss": 1.2527, "step": 28213 }, { "epoch": 0.77, "learning_rate": 2.6372771752507963e-06, "loss": 1.1335, "step": 28214 }, { "epoch": 0.77, "learning_rate": 2.6366786709510274e-06, "loss": 1.2739, "step": 28215 }, { "epoch": 0.77, "learning_rate": 2.636080224258415e-06, "loss": 1.3032, "step": 28216 }, { "epoch": 0.77, "learning_rate": 2.635481835177651e-06, "loss": 1.3079, "step": 28217 }, { "epoch": 0.77, "learning_rate": 2.6348835037134126e-06, "loss": 1.4116, "step": 28218 }, { "epoch": 0.77, "learning_rate": 2.634285229870387e-06, "loss": 1.2661, "step": 28219 }, { "epoch": 0.77, "learning_rate": 2.6336870136532455e-06, "loss": 1.2671, "step": 28220 }, { "epoch": 0.77, "learning_rate": 2.6330888550666744e-06, "loss": 1.1736, "step": 28221 }, { "epoch": 0.77, "learning_rate": 2.63249075411535e-06, "loss": 1.3718, "step": 28222 }, { "epoch": 0.77, "learning_rate": 2.6318927108039594e-06, "loss": 1.1782, "step": 28223 }, { "epoch": 0.77, "learning_rate": 2.631294725137169e-06, "loss": 1.2566, "step": 28224 }, { "epoch": 0.77, "learning_rate": 2.6306967971196673e-06, "loss": 1.3979, "step": 28225 }, { "epoch": 0.77, "learning_rate": 2.630098926756125e-06, "loss": 1.4089, "step": 28226 }, { "epoch": 0.77, "learning_rate": 2.629501114051226e-06, "loss": 1.2324, "step": 28227 }, { "epoch": 0.77, "learning_rate": 2.6289033590096447e-06, "loss": 1.1577, "step": 28228 }, { "epoch": 0.77, "learning_rate": 2.628305661636055e-06, "loss": 1.2219, "step": 28229 }, { "epoch": 0.77, "learning_rate": 2.627708021935137e-06, "loss": 1.3135, "step": 28230 }, { "epoch": 0.77, "learning_rate": 2.6271104399115655e-06, "loss": 1.2771, "step": 28231 }, { "epoch": 0.77, "learning_rate": 2.626512915570015e-06, "loss": 1.2314, "step": 28232 }, { "epoch": 0.77, "learning_rate": 2.625915448915157e-06, "loss": 1.2507, "step": 28233 }, { "epoch": 0.77, "learning_rate": 2.6253180399516733e-06, "loss": 1.2629, "step": 28234 }, { "epoch": 0.77, "learning_rate": 2.6247206886842312e-06, "loss": 1.0894, "step": 28235 }, { "epoch": 0.77, "learning_rate": 2.6241233951175083e-06, "loss": 1.2141, "step": 28236 }, { "epoch": 0.77, "learning_rate": 2.6235261592561712e-06, "loss": 1.2683, "step": 28237 }, { "epoch": 0.77, "learning_rate": 2.6229289811049007e-06, "loss": 1.3589, "step": 28238 }, { "epoch": 0.77, "learning_rate": 2.6223318606683647e-06, "loss": 1.3123, "step": 28239 }, { "epoch": 0.77, "learning_rate": 2.6217347979512342e-06, "loss": 1.1786, "step": 28240 }, { "epoch": 0.77, "learning_rate": 2.621137792958178e-06, "loss": 1.3433, "step": 28241 }, { "epoch": 0.77, "learning_rate": 2.620540845693874e-06, "loss": 1.3074, "step": 28242 }, { "epoch": 0.77, "learning_rate": 2.619943956162988e-06, "loss": 1.2471, "step": 28243 }, { "epoch": 0.77, "learning_rate": 2.619347124370187e-06, "loss": 1.0801, "step": 28244 }, { "epoch": 0.77, "learning_rate": 2.618750350320147e-06, "loss": 1.3074, "step": 28245 }, { "epoch": 0.77, "learning_rate": 2.6181536340175327e-06, "loss": 1.2512, "step": 28246 }, { "epoch": 0.77, "learning_rate": 2.6175569754670138e-06, "loss": 1.1873, "step": 28247 }, { "epoch": 0.77, "learning_rate": 2.616960374673254e-06, "loss": 1.0262, "step": 28248 }, { "epoch": 0.77, "learning_rate": 2.616363831640928e-06, "loss": 1.2512, "step": 28249 }, { "epoch": 0.77, "learning_rate": 2.615767346374699e-06, "loss": 1.3098, "step": 28250 }, { "epoch": 0.77, "learning_rate": 2.615170918879234e-06, "loss": 1.3113, "step": 28251 }, { "epoch": 0.77, "learning_rate": 2.6145745491591967e-06, "loss": 1.4275, "step": 28252 }, { "epoch": 0.77, "learning_rate": 2.613978237219258e-06, "loss": 1.3052, "step": 28253 }, { "epoch": 0.77, "learning_rate": 2.6133819830640795e-06, "loss": 1.271, "step": 28254 }, { "epoch": 0.77, "learning_rate": 2.612785786698329e-06, "loss": 1.3357, "step": 28255 }, { "epoch": 0.77, "learning_rate": 2.612189648126664e-06, "loss": 1.238, "step": 28256 }, { "epoch": 0.77, "learning_rate": 2.6115935673537563e-06, "loss": 1.1477, "step": 28257 }, { "epoch": 0.77, "learning_rate": 2.6109975443842663e-06, "loss": 1.3623, "step": 28258 }, { "epoch": 0.77, "learning_rate": 2.6104015792228543e-06, "loss": 1.2839, "step": 28259 }, { "epoch": 0.77, "learning_rate": 2.6098056718741883e-06, "loss": 1.2314, "step": 28260 }, { "epoch": 0.77, "learning_rate": 2.6092098223429253e-06, "loss": 1.2529, "step": 28261 }, { "epoch": 0.77, "learning_rate": 2.608614030633735e-06, "loss": 1.3103, "step": 28262 }, { "epoch": 0.77, "learning_rate": 2.608018296751266e-06, "loss": 1.2161, "step": 28263 }, { "epoch": 0.77, "learning_rate": 2.6074226207001897e-06, "loss": 1.2147, "step": 28264 }, { "epoch": 0.77, "learning_rate": 2.6068270024851594e-06, "loss": 1.2122, "step": 28265 }, { "epoch": 0.77, "learning_rate": 2.6062314421108436e-06, "loss": 1.1992, "step": 28266 }, { "epoch": 0.77, "learning_rate": 2.605635939581891e-06, "loss": 1.1936, "step": 28267 }, { "epoch": 0.77, "learning_rate": 2.6050404949029682e-06, "loss": 1.3359, "step": 28268 }, { "epoch": 0.77, "learning_rate": 2.6044451080787293e-06, "loss": 1.2222, "step": 28269 }, { "epoch": 0.77, "learning_rate": 2.6038497791138385e-06, "loss": 1.3547, "step": 28270 }, { "epoch": 0.77, "learning_rate": 2.6032545080129446e-06, "loss": 1.3877, "step": 28271 }, { "epoch": 0.77, "learning_rate": 2.6026592947807116e-06, "loss": 1.1733, "step": 28272 }, { "epoch": 0.77, "learning_rate": 2.6020641394217903e-06, "loss": 1.2617, "step": 28273 }, { "epoch": 0.77, "learning_rate": 2.6014690419408438e-06, "loss": 1.4192, "step": 28274 }, { "epoch": 0.77, "learning_rate": 2.6008740023425248e-06, "loss": 1.1445, "step": 28275 }, { "epoch": 0.77, "learning_rate": 2.6002790206314855e-06, "loss": 1.1599, "step": 28276 }, { "epoch": 0.77, "learning_rate": 2.599684096812386e-06, "loss": 1.1968, "step": 28277 }, { "epoch": 0.77, "learning_rate": 2.5990892308898783e-06, "loss": 1.1365, "step": 28278 }, { "epoch": 0.77, "learning_rate": 2.598494422868616e-06, "loss": 1.2688, "step": 28279 }, { "epoch": 0.77, "learning_rate": 2.5978996727532514e-06, "loss": 1.291, "step": 28280 }, { "epoch": 0.77, "learning_rate": 2.5973049805484407e-06, "loss": 1.2646, "step": 28281 }, { "epoch": 0.77, "learning_rate": 2.596710346258835e-06, "loss": 1.3779, "step": 28282 }, { "epoch": 0.77, "learning_rate": 2.596115769889086e-06, "loss": 1.2397, "step": 28283 }, { "epoch": 0.77, "learning_rate": 2.5955212514438432e-06, "loss": 1.2075, "step": 28284 }, { "epoch": 0.77, "learning_rate": 2.594926790927763e-06, "loss": 1.1208, "step": 28285 }, { "epoch": 0.77, "learning_rate": 2.594332388345494e-06, "loss": 1.77, "step": 28286 }, { "epoch": 0.77, "learning_rate": 2.5937380437016858e-06, "loss": 1.134, "step": 28287 }, { "epoch": 0.77, "learning_rate": 2.5931437570009855e-06, "loss": 1.2209, "step": 28288 }, { "epoch": 0.77, "learning_rate": 2.592549528248047e-06, "loss": 1.1741, "step": 28289 }, { "epoch": 0.77, "learning_rate": 2.5919553574475198e-06, "loss": 1.5308, "step": 28290 }, { "epoch": 0.77, "learning_rate": 2.591361244604047e-06, "loss": 1.353, "step": 28291 }, { "epoch": 0.77, "learning_rate": 2.590767189722282e-06, "loss": 1.0862, "step": 28292 }, { "epoch": 0.77, "learning_rate": 2.5901731928068717e-06, "loss": 1.1851, "step": 28293 }, { "epoch": 0.77, "learning_rate": 2.589579253862461e-06, "loss": 1.2009, "step": 28294 }, { "epoch": 0.77, "learning_rate": 2.588985372893695e-06, "loss": 1.436, "step": 28295 }, { "epoch": 0.77, "learning_rate": 2.588391549905226e-06, "loss": 1.2483, "step": 28296 }, { "epoch": 0.77, "learning_rate": 2.5877977849016954e-06, "loss": 1.2573, "step": 28297 }, { "epoch": 0.77, "learning_rate": 2.5872040778877505e-06, "loss": 1.3364, "step": 28298 }, { "epoch": 0.77, "learning_rate": 2.5866104288680314e-06, "loss": 1.4185, "step": 28299 }, { "epoch": 0.77, "learning_rate": 2.5860168378471895e-06, "loss": 1.114, "step": 28300 }, { "epoch": 0.77, "learning_rate": 2.585423304829865e-06, "loss": 1.2332, "step": 28301 }, { "epoch": 0.77, "learning_rate": 2.5848298298207033e-06, "loss": 1.2947, "step": 28302 }, { "epoch": 0.77, "learning_rate": 2.5842364128243423e-06, "loss": 1.127, "step": 28303 }, { "epoch": 0.77, "learning_rate": 2.583643053845428e-06, "loss": 1.1406, "step": 28304 }, { "epoch": 0.77, "learning_rate": 2.58304975288861e-06, "loss": 1.2678, "step": 28305 }, { "epoch": 0.77, "learning_rate": 2.5824565099585164e-06, "loss": 1.1992, "step": 28306 }, { "epoch": 0.77, "learning_rate": 2.581863325059798e-06, "loss": 1.3025, "step": 28307 }, { "epoch": 0.77, "learning_rate": 2.58127019819709e-06, "loss": 1.3198, "step": 28308 }, { "epoch": 0.77, "learning_rate": 2.580677129375042e-06, "loss": 1.2939, "step": 28309 }, { "epoch": 0.77, "learning_rate": 2.5800841185982804e-06, "loss": 1.0635, "step": 28310 }, { "epoch": 0.77, "learning_rate": 2.579491165871455e-06, "loss": 1.2124, "step": 28311 }, { "epoch": 0.77, "learning_rate": 2.578898271199198e-06, "loss": 1.4014, "step": 28312 }, { "epoch": 0.77, "learning_rate": 2.578305434586158e-06, "loss": 1.219, "step": 28313 }, { "epoch": 0.77, "learning_rate": 2.5777126560369604e-06, "loss": 1.1846, "step": 28314 }, { "epoch": 0.77, "learning_rate": 2.57711993555625e-06, "loss": 1.1809, "step": 28315 }, { "epoch": 0.77, "learning_rate": 2.5765272731486623e-06, "loss": 1.3398, "step": 28316 }, { "epoch": 0.77, "learning_rate": 2.575934668818839e-06, "loss": 1.2642, "step": 28317 }, { "epoch": 0.77, "learning_rate": 2.5753421225714057e-06, "loss": 1.3169, "step": 28318 }, { "epoch": 0.77, "learning_rate": 2.574749634411008e-06, "loss": 1.2847, "step": 28319 }, { "epoch": 0.77, "learning_rate": 2.5741572043422738e-06, "loss": 1.3884, "step": 28320 }, { "epoch": 0.77, "learning_rate": 2.573564832369845e-06, "loss": 1.2605, "step": 28321 }, { "epoch": 0.77, "learning_rate": 2.5729725184983533e-06, "loss": 1.3994, "step": 28322 }, { "epoch": 0.77, "learning_rate": 2.572380262732429e-06, "loss": 1.3267, "step": 28323 }, { "epoch": 0.77, "learning_rate": 2.5717880650767114e-06, "loss": 1.2131, "step": 28324 }, { "epoch": 0.77, "learning_rate": 2.571195925535831e-06, "loss": 1.3267, "step": 28325 }, { "epoch": 0.77, "learning_rate": 2.570603844114421e-06, "loss": 1.3857, "step": 28326 }, { "epoch": 0.77, "learning_rate": 2.5700118208171086e-06, "loss": 1.4065, "step": 28327 }, { "epoch": 0.77, "learning_rate": 2.569419855648535e-06, "loss": 1.219, "step": 28328 }, { "epoch": 0.77, "learning_rate": 2.568827948613325e-06, "loss": 1.2568, "step": 28329 }, { "epoch": 0.77, "learning_rate": 2.5682360997161105e-06, "loss": 1.2629, "step": 28330 }, { "epoch": 0.77, "learning_rate": 2.56764430896152e-06, "loss": 1.688, "step": 28331 }, { "epoch": 0.77, "learning_rate": 2.5670525763541875e-06, "loss": 1.2576, "step": 28332 }, { "epoch": 0.77, "learning_rate": 2.566460901898742e-06, "loss": 1.2251, "step": 28333 }, { "epoch": 0.77, "learning_rate": 2.565869285599809e-06, "loss": 1.2346, "step": 28334 }, { "epoch": 0.77, "learning_rate": 2.5652777274620167e-06, "loss": 1.0527, "step": 28335 }, { "epoch": 0.77, "learning_rate": 2.5646862274899987e-06, "loss": 0.9751, "step": 28336 }, { "epoch": 0.77, "learning_rate": 2.564094785688379e-06, "loss": 1.239, "step": 28337 }, { "epoch": 0.77, "learning_rate": 2.563503402061782e-06, "loss": 1.6143, "step": 28338 }, { "epoch": 0.77, "learning_rate": 2.562912076614842e-06, "loss": 1.3542, "step": 28339 }, { "epoch": 0.77, "learning_rate": 2.562320809352179e-06, "loss": 1.3337, "step": 28340 }, { "epoch": 0.77, "learning_rate": 2.5617296002784208e-06, "loss": 1.3447, "step": 28341 }, { "epoch": 0.77, "learning_rate": 2.5611384493981893e-06, "loss": 1.2415, "step": 28342 }, { "epoch": 0.77, "learning_rate": 2.5605473567161165e-06, "loss": 1.134, "step": 28343 }, { "epoch": 0.77, "learning_rate": 2.559956322236823e-06, "loss": 1.1287, "step": 28344 }, { "epoch": 0.77, "learning_rate": 2.5593653459649314e-06, "loss": 1.1152, "step": 28345 }, { "epoch": 0.77, "learning_rate": 2.558774427905064e-06, "loss": 1.2498, "step": 28346 }, { "epoch": 0.77, "learning_rate": 2.5581835680618495e-06, "loss": 1.2644, "step": 28347 }, { "epoch": 0.77, "learning_rate": 2.557592766439908e-06, "loss": 1.2354, "step": 28348 }, { "epoch": 0.77, "learning_rate": 2.55700202304386e-06, "loss": 1.2078, "step": 28349 }, { "epoch": 0.77, "learning_rate": 2.5564113378783263e-06, "loss": 1.3967, "step": 28350 }, { "epoch": 0.77, "learning_rate": 2.5558207109479295e-06, "loss": 1.3315, "step": 28351 }, { "epoch": 0.77, "learning_rate": 2.555230142257297e-06, "loss": 1.1938, "step": 28352 }, { "epoch": 0.77, "learning_rate": 2.5546396318110365e-06, "loss": 1.2341, "step": 28353 }, { "epoch": 0.77, "learning_rate": 2.5540491796137777e-06, "loss": 1.2979, "step": 28354 }, { "epoch": 0.77, "learning_rate": 2.5534587856701344e-06, "loss": 1.2576, "step": 28355 }, { "epoch": 0.77, "learning_rate": 2.5528684499847333e-06, "loss": 1.3203, "step": 28356 }, { "epoch": 0.77, "learning_rate": 2.5522781725621814e-06, "loss": 1.3538, "step": 28357 }, { "epoch": 0.77, "learning_rate": 2.551687953407107e-06, "loss": 1.2979, "step": 28358 }, { "epoch": 0.77, "learning_rate": 2.55109779252412e-06, "loss": 1.2002, "step": 28359 }, { "epoch": 0.77, "learning_rate": 2.5505076899178473e-06, "loss": 1.3638, "step": 28360 }, { "epoch": 0.77, "learning_rate": 2.5499176455928933e-06, "loss": 1.2844, "step": 28361 }, { "epoch": 0.77, "learning_rate": 2.549327659553883e-06, "loss": 1.3613, "step": 28362 }, { "epoch": 0.77, "learning_rate": 2.5487377318054276e-06, "loss": 1.3325, "step": 28363 }, { "epoch": 0.77, "learning_rate": 2.5481478623521493e-06, "loss": 1.2234, "step": 28364 }, { "epoch": 0.77, "learning_rate": 2.547558051198652e-06, "loss": 1.3528, "step": 28365 }, { "epoch": 0.77, "learning_rate": 2.546968298349557e-06, "loss": 1.3779, "step": 28366 }, { "epoch": 0.77, "learning_rate": 2.5463786038094796e-06, "loss": 1.3079, "step": 28367 }, { "epoch": 0.77, "learning_rate": 2.5457889675830316e-06, "loss": 1.2017, "step": 28368 }, { "epoch": 0.77, "learning_rate": 2.5451993896748252e-06, "loss": 1.2002, "step": 28369 }, { "epoch": 0.77, "learning_rate": 2.5446098700894693e-06, "loss": 1.7271, "step": 28370 }, { "epoch": 0.77, "learning_rate": 2.5440204088315844e-06, "loss": 1.2388, "step": 28371 }, { "epoch": 0.77, "learning_rate": 2.5434310059057774e-06, "loss": 1.1868, "step": 28372 }, { "epoch": 0.77, "learning_rate": 2.5428416613166597e-06, "loss": 1.2749, "step": 28373 }, { "epoch": 0.77, "learning_rate": 2.54225237506884e-06, "loss": 1.2542, "step": 28374 }, { "epoch": 0.77, "learning_rate": 2.541663147166933e-06, "loss": 1.3044, "step": 28375 }, { "epoch": 0.77, "learning_rate": 2.541073977615547e-06, "loss": 1.3201, "step": 28376 }, { "epoch": 0.77, "learning_rate": 2.5404848664192894e-06, "loss": 1.2104, "step": 28377 }, { "epoch": 0.77, "learning_rate": 2.539895813582769e-06, "loss": 1.3308, "step": 28378 }, { "epoch": 0.78, "learning_rate": 2.5393068191105986e-06, "loss": 1.3242, "step": 28379 }, { "epoch": 0.78, "learning_rate": 2.538717883007382e-06, "loss": 1.1304, "step": 28380 }, { "epoch": 0.78, "learning_rate": 2.53812900527773e-06, "loss": 1.3413, "step": 28381 }, { "epoch": 0.78, "learning_rate": 2.537540185926244e-06, "loss": 1.3521, "step": 28382 }, { "epoch": 0.78, "learning_rate": 2.5369514249575377e-06, "loss": 1.2686, "step": 28383 }, { "epoch": 0.78, "learning_rate": 2.536362722376213e-06, "loss": 1.2073, "step": 28384 }, { "epoch": 0.78, "learning_rate": 2.5357740781868755e-06, "loss": 1.2244, "step": 28385 }, { "epoch": 0.78, "learning_rate": 2.535185492394133e-06, "loss": 1.1926, "step": 28386 }, { "epoch": 0.78, "learning_rate": 2.5345969650025904e-06, "loss": 1.3059, "step": 28387 }, { "epoch": 0.78, "learning_rate": 2.5340084960168497e-06, "loss": 1.1633, "step": 28388 }, { "epoch": 0.78, "learning_rate": 2.5334200854415135e-06, "loss": 1.1277, "step": 28389 }, { "epoch": 0.78, "learning_rate": 2.5328317332811903e-06, "loss": 1.3245, "step": 28390 }, { "epoch": 0.78, "learning_rate": 2.5322434395404792e-06, "loss": 1.2847, "step": 28391 }, { "epoch": 0.78, "learning_rate": 2.531655204223985e-06, "loss": 1.3691, "step": 28392 }, { "epoch": 0.78, "learning_rate": 2.5310670273363057e-06, "loss": 1.2725, "step": 28393 }, { "epoch": 0.78, "learning_rate": 2.530478908882048e-06, "loss": 1.2351, "step": 28394 }, { "epoch": 0.78, "learning_rate": 2.5298908488658125e-06, "loss": 1.2532, "step": 28395 }, { "epoch": 0.78, "learning_rate": 2.5293028472921966e-06, "loss": 1.1599, "step": 28396 }, { "epoch": 0.78, "learning_rate": 2.5287149041658e-06, "loss": 1.1663, "step": 28397 }, { "epoch": 0.78, "learning_rate": 2.5281270194912243e-06, "loss": 1.8105, "step": 28398 }, { "epoch": 0.78, "learning_rate": 2.527539193273073e-06, "loss": 1.2112, "step": 28399 }, { "epoch": 0.78, "learning_rate": 2.526951425515941e-06, "loss": 1.374, "step": 28400 }, { "epoch": 0.78, "learning_rate": 2.526363716224427e-06, "loss": 1.2803, "step": 28401 }, { "epoch": 0.78, "learning_rate": 2.525776065403126e-06, "loss": 1.3335, "step": 28402 }, { "epoch": 0.78, "learning_rate": 2.525188473056641e-06, "loss": 1.2861, "step": 28403 }, { "epoch": 0.78, "learning_rate": 2.5246009391895665e-06, "loss": 1.3467, "step": 28404 }, { "epoch": 0.78, "learning_rate": 2.5240134638064996e-06, "loss": 1.2739, "step": 28405 }, { "epoch": 0.78, "learning_rate": 2.523426046912032e-06, "loss": 1.375, "step": 28406 }, { "epoch": 0.78, "learning_rate": 2.5228386885107668e-06, "loss": 1.1638, "step": 28407 }, { "epoch": 0.78, "learning_rate": 2.522251388607296e-06, "loss": 1.2544, "step": 28408 }, { "epoch": 0.78, "learning_rate": 2.5216641472062144e-06, "loss": 1.2498, "step": 28409 }, { "epoch": 0.78, "learning_rate": 2.5210769643121123e-06, "loss": 1.3403, "step": 28410 }, { "epoch": 0.78, "learning_rate": 2.52048983992959e-06, "loss": 1.3491, "step": 28411 }, { "epoch": 0.78, "learning_rate": 2.5199027740632385e-06, "loss": 1.0771, "step": 28412 }, { "epoch": 0.78, "learning_rate": 2.519315766717647e-06, "loss": 1.4097, "step": 28413 }, { "epoch": 0.78, "learning_rate": 2.5187288178974144e-06, "loss": 1.262, "step": 28414 }, { "epoch": 0.78, "learning_rate": 2.5181419276071293e-06, "loss": 1.6797, "step": 28415 }, { "epoch": 0.78, "learning_rate": 2.517555095851384e-06, "loss": 1.167, "step": 28416 }, { "epoch": 0.78, "learning_rate": 2.5169683226347664e-06, "loss": 1.3279, "step": 28417 }, { "epoch": 0.78, "learning_rate": 2.516381607961872e-06, "loss": 1.1702, "step": 28418 }, { "epoch": 0.78, "learning_rate": 2.5157949518372892e-06, "loss": 1.119, "step": 28419 }, { "epoch": 0.78, "learning_rate": 2.515208354265608e-06, "loss": 1.2502, "step": 28420 }, { "epoch": 0.78, "learning_rate": 2.5146218152514134e-06, "loss": 1.3059, "step": 28421 }, { "epoch": 0.78, "learning_rate": 2.5140353347993006e-06, "loss": 1.2883, "step": 28422 }, { "epoch": 0.78, "learning_rate": 2.513448912913856e-06, "loss": 1.3281, "step": 28423 }, { "epoch": 0.78, "learning_rate": 2.512862549599666e-06, "loss": 1.2805, "step": 28424 }, { "epoch": 0.78, "learning_rate": 2.512276244861316e-06, "loss": 1.1379, "step": 28425 }, { "epoch": 0.78, "learning_rate": 2.511689998703398e-06, "loss": 1.2913, "step": 28426 }, { "epoch": 0.78, "learning_rate": 2.5111038111304976e-06, "loss": 1.1748, "step": 28427 }, { "epoch": 0.78, "learning_rate": 2.5105176821471956e-06, "loss": 1.2461, "step": 28428 }, { "epoch": 0.78, "learning_rate": 2.5099316117580842e-06, "loss": 1.4224, "step": 28429 }, { "epoch": 0.78, "learning_rate": 2.5093455999677463e-06, "loss": 1.2546, "step": 28430 }, { "epoch": 0.78, "learning_rate": 2.508759646780766e-06, "loss": 1.3235, "step": 28431 }, { "epoch": 0.78, "learning_rate": 2.5081737522017248e-06, "loss": 1.0974, "step": 28432 }, { "epoch": 0.78, "learning_rate": 2.5075879162352114e-06, "loss": 1.0581, "step": 28433 }, { "epoch": 0.78, "learning_rate": 2.5070021388858044e-06, "loss": 1.2612, "step": 28434 }, { "epoch": 0.78, "learning_rate": 2.5064164201580954e-06, "loss": 1.3472, "step": 28435 }, { "epoch": 0.78, "learning_rate": 2.5058307600566546e-06, "loss": 1.1475, "step": 28436 }, { "epoch": 0.78, "learning_rate": 2.505245158586074e-06, "loss": 1.2053, "step": 28437 }, { "epoch": 0.78, "learning_rate": 2.504659615750926e-06, "loss": 1.2991, "step": 28438 }, { "epoch": 0.78, "learning_rate": 2.5040741315558037e-06, "loss": 1.3628, "step": 28439 }, { "epoch": 0.78, "learning_rate": 2.5034887060052738e-06, "loss": 1.28, "step": 28440 }, { "epoch": 0.78, "learning_rate": 2.502903339103927e-06, "loss": 1.2434, "step": 28441 }, { "epoch": 0.78, "learning_rate": 2.5023180308563356e-06, "loss": 1.1238, "step": 28442 }, { "epoch": 0.78, "learning_rate": 2.501732781267089e-06, "loss": 1.1675, "step": 28443 }, { "epoch": 0.78, "learning_rate": 2.501147590340752e-06, "loss": 1.1873, "step": 28444 }, { "epoch": 0.78, "learning_rate": 2.500562458081911e-06, "loss": 1.0153, "step": 28445 }, { "epoch": 0.78, "learning_rate": 2.4999773844951457e-06, "loss": 1.2419, "step": 28446 }, { "epoch": 0.78, "learning_rate": 2.4993923695850307e-06, "loss": 1.1528, "step": 28447 }, { "epoch": 0.78, "learning_rate": 2.4988074133561424e-06, "loss": 1.3367, "step": 28448 }, { "epoch": 0.78, "learning_rate": 2.4982225158130548e-06, "loss": 1.3965, "step": 28449 }, { "epoch": 0.78, "learning_rate": 2.4976376769603493e-06, "loss": 1.2632, "step": 28450 }, { "epoch": 0.78, "learning_rate": 2.4970528968025985e-06, "loss": 1.3118, "step": 28451 }, { "epoch": 0.78, "learning_rate": 2.4964681753443786e-06, "loss": 1.0791, "step": 28452 }, { "epoch": 0.78, "learning_rate": 2.4958835125902604e-06, "loss": 1.3125, "step": 28453 }, { "epoch": 0.78, "learning_rate": 2.495298908544823e-06, "loss": 1.2112, "step": 28454 }, { "epoch": 0.78, "learning_rate": 2.494714363212638e-06, "loss": 1.1936, "step": 28455 }, { "epoch": 0.78, "learning_rate": 2.494129876598279e-06, "loss": 1.3, "step": 28456 }, { "epoch": 0.78, "learning_rate": 2.493545448706315e-06, "loss": 1.176, "step": 28457 }, { "epoch": 0.78, "learning_rate": 2.4929610795413253e-06, "loss": 1.3105, "step": 28458 }, { "epoch": 0.78, "learning_rate": 2.4923767691078772e-06, "loss": 1.2961, "step": 28459 }, { "epoch": 0.78, "learning_rate": 2.4917925174105406e-06, "loss": 1.3542, "step": 28460 }, { "epoch": 0.78, "learning_rate": 2.491208324453892e-06, "loss": 1.27, "step": 28461 }, { "epoch": 0.78, "learning_rate": 2.4906241902424977e-06, "loss": 1.1919, "step": 28462 }, { "epoch": 0.78, "learning_rate": 2.4900401147809296e-06, "loss": 1.2642, "step": 28463 }, { "epoch": 0.78, "learning_rate": 2.4894560980737527e-06, "loss": 1.1692, "step": 28464 }, { "epoch": 0.78, "learning_rate": 2.4888721401255423e-06, "loss": 1.1372, "step": 28465 }, { "epoch": 0.78, "learning_rate": 2.488288240940864e-06, "loss": 1.2485, "step": 28466 }, { "epoch": 0.78, "learning_rate": 2.487704400524287e-06, "loss": 1.217, "step": 28467 }, { "epoch": 0.78, "learning_rate": 2.4871206188803755e-06, "loss": 1.2498, "step": 28468 }, { "epoch": 0.78, "learning_rate": 2.4865368960137014e-06, "loss": 1.1414, "step": 28469 }, { "epoch": 0.78, "learning_rate": 2.4859532319288304e-06, "loss": 1.2122, "step": 28470 }, { "epoch": 0.78, "learning_rate": 2.4853696266303273e-06, "loss": 1.3518, "step": 28471 }, { "epoch": 0.78, "learning_rate": 2.4847860801227565e-06, "loss": 1.3225, "step": 28472 }, { "epoch": 0.78, "learning_rate": 2.4842025924106873e-06, "loss": 1.3169, "step": 28473 }, { "epoch": 0.78, "learning_rate": 2.483619163498684e-06, "loss": 1.1101, "step": 28474 }, { "epoch": 0.78, "learning_rate": 2.4830357933913063e-06, "loss": 1.3203, "step": 28475 }, { "epoch": 0.78, "learning_rate": 2.482452482093125e-06, "loss": 1.3152, "step": 28476 }, { "epoch": 0.78, "learning_rate": 2.4818692296086978e-06, "loss": 1.2625, "step": 28477 }, { "epoch": 0.78, "learning_rate": 2.481286035942595e-06, "loss": 1.1785, "step": 28478 }, { "epoch": 0.78, "learning_rate": 2.48070290109937e-06, "loss": 1.2671, "step": 28479 }, { "epoch": 0.78, "learning_rate": 2.4801198250835933e-06, "loss": 1.2009, "step": 28480 }, { "epoch": 0.78, "learning_rate": 2.4795368078998183e-06, "loss": 1.1123, "step": 28481 }, { "epoch": 0.78, "learning_rate": 2.478953849552618e-06, "loss": 1.2563, "step": 28482 }, { "epoch": 0.78, "learning_rate": 2.4783709500465404e-06, "loss": 1.2126, "step": 28483 }, { "epoch": 0.78, "learning_rate": 2.4777881093861545e-06, "loss": 1.22, "step": 28484 }, { "epoch": 0.78, "learning_rate": 2.4772053275760135e-06, "loss": 1.177, "step": 28485 }, { "epoch": 0.78, "learning_rate": 2.4766226046206867e-06, "loss": 1.0334, "step": 28486 }, { "epoch": 0.78, "learning_rate": 2.4760399405247214e-06, "loss": 1.3308, "step": 28487 }, { "epoch": 0.78, "learning_rate": 2.475457335292685e-06, "loss": 1.3479, "step": 28488 }, { "epoch": 0.78, "learning_rate": 2.474874788929128e-06, "loss": 1.2161, "step": 28489 }, { "epoch": 0.78, "learning_rate": 2.4742923014386154e-06, "loss": 1.7314, "step": 28490 }, { "epoch": 0.78, "learning_rate": 2.4737098728257012e-06, "loss": 1.2175, "step": 28491 }, { "epoch": 0.78, "learning_rate": 2.473127503094939e-06, "loss": 1.2842, "step": 28492 }, { "epoch": 0.78, "learning_rate": 2.4725451922508904e-06, "loss": 1.2214, "step": 28493 }, { "epoch": 0.78, "learning_rate": 2.471962940298108e-06, "loss": 1.3105, "step": 28494 }, { "epoch": 0.78, "learning_rate": 2.471380747241149e-06, "loss": 1.2334, "step": 28495 }, { "epoch": 0.78, "learning_rate": 2.4707986130845628e-06, "loss": 1.208, "step": 28496 }, { "epoch": 0.78, "learning_rate": 2.4702165378329115e-06, "loss": 1.2625, "step": 28497 }, { "epoch": 0.78, "learning_rate": 2.469634521490745e-06, "loss": 1.2334, "step": 28498 }, { "epoch": 0.78, "learning_rate": 2.4690525640626174e-06, "loss": 1.2473, "step": 28499 }, { "epoch": 0.78, "learning_rate": 2.4684706655530777e-06, "loss": 1.2163, "step": 28500 }, { "epoch": 0.78, "learning_rate": 2.4678888259666845e-06, "loss": 1.1541, "step": 28501 }, { "epoch": 0.78, "learning_rate": 2.4673070453079872e-06, "loss": 1.3137, "step": 28502 }, { "epoch": 0.78, "learning_rate": 2.466725323581539e-06, "loss": 1.3462, "step": 28503 }, { "epoch": 0.78, "learning_rate": 2.4661436607918856e-06, "loss": 1.2971, "step": 28504 }, { "epoch": 0.78, "learning_rate": 2.4655620569435847e-06, "loss": 1.2727, "step": 28505 }, { "epoch": 0.78, "learning_rate": 2.4649805120411816e-06, "loss": 1.2893, "step": 28506 }, { "epoch": 0.78, "learning_rate": 2.464399026089227e-06, "loss": 1.1985, "step": 28507 }, { "epoch": 0.78, "learning_rate": 2.463817599092273e-06, "loss": 1.2288, "step": 28508 }, { "epoch": 0.78, "learning_rate": 2.4632362310548664e-06, "loss": 1.1301, "step": 28509 }, { "epoch": 0.78, "learning_rate": 2.4626549219815553e-06, "loss": 1.2075, "step": 28510 }, { "epoch": 0.78, "learning_rate": 2.4620736718768858e-06, "loss": 1.2151, "step": 28511 }, { "epoch": 0.78, "learning_rate": 2.461492480745409e-06, "loss": 1.2922, "step": 28512 }, { "epoch": 0.78, "learning_rate": 2.4609113485916713e-06, "loss": 1.1646, "step": 28513 }, { "epoch": 0.78, "learning_rate": 2.4603302754202175e-06, "loss": 1.1318, "step": 28514 }, { "epoch": 0.78, "learning_rate": 2.459749261235591e-06, "loss": 1.2432, "step": 28515 }, { "epoch": 0.78, "learning_rate": 2.4591683060423446e-06, "loss": 1.1194, "step": 28516 }, { "epoch": 0.78, "learning_rate": 2.458587409845018e-06, "loss": 1.2493, "step": 28517 }, { "epoch": 0.78, "learning_rate": 2.4580065726481582e-06, "loss": 1.1528, "step": 28518 }, { "epoch": 0.78, "learning_rate": 2.4574257944563053e-06, "loss": 1.2522, "step": 28519 }, { "epoch": 0.78, "learning_rate": 2.4568450752740093e-06, "loss": 1.2256, "step": 28520 }, { "epoch": 0.78, "learning_rate": 2.45626441510581e-06, "loss": 1.3184, "step": 28521 }, { "epoch": 0.78, "learning_rate": 2.4556838139562478e-06, "loss": 1.4209, "step": 28522 }, { "epoch": 0.78, "learning_rate": 2.4551032718298705e-06, "loss": 1.4097, "step": 28523 }, { "epoch": 0.78, "learning_rate": 2.454522788731215e-06, "loss": 1.1934, "step": 28524 }, { "epoch": 0.78, "learning_rate": 2.453942364664831e-06, "loss": 1.1633, "step": 28525 }, { "epoch": 0.78, "learning_rate": 2.4533619996352476e-06, "loss": 1.168, "step": 28526 }, { "epoch": 0.78, "learning_rate": 2.4527816936470138e-06, "loss": 1.2542, "step": 28527 }, { "epoch": 0.78, "learning_rate": 2.452201446704664e-06, "loss": 1.3496, "step": 28528 }, { "epoch": 0.78, "learning_rate": 2.4516212588127474e-06, "loss": 1.2095, "step": 28529 }, { "epoch": 0.78, "learning_rate": 2.4510411299757895e-06, "loss": 1.2705, "step": 28530 }, { "epoch": 0.78, "learning_rate": 2.4504610601983402e-06, "loss": 1.3391, "step": 28531 }, { "epoch": 0.78, "learning_rate": 2.44988104948493e-06, "loss": 1.1465, "step": 28532 }, { "epoch": 0.78, "learning_rate": 2.449301097840107e-06, "loss": 1.2627, "step": 28533 }, { "epoch": 0.78, "learning_rate": 2.448721205268395e-06, "loss": 1.3032, "step": 28534 }, { "epoch": 0.78, "learning_rate": 2.4481413717743395e-06, "loss": 1.3862, "step": 28535 }, { "epoch": 0.78, "learning_rate": 2.4475615973624734e-06, "loss": 1.2812, "step": 28536 }, { "epoch": 0.78, "learning_rate": 2.4469818820373357e-06, "loss": 1.2603, "step": 28537 }, { "epoch": 0.78, "learning_rate": 2.44640222580346e-06, "loss": 1.7778, "step": 28538 }, { "epoch": 0.78, "learning_rate": 2.44582262866538e-06, "loss": 1.2354, "step": 28539 }, { "epoch": 0.78, "learning_rate": 2.4452430906276338e-06, "loss": 1.0522, "step": 28540 }, { "epoch": 0.78, "learning_rate": 2.444663611694752e-06, "loss": 1.1951, "step": 28541 }, { "epoch": 0.78, "learning_rate": 2.44408419187127e-06, "loss": 1.3506, "step": 28542 }, { "epoch": 0.78, "learning_rate": 2.443504831161717e-06, "loss": 1.3784, "step": 28543 }, { "epoch": 0.78, "learning_rate": 2.4429255295706335e-06, "loss": 1.1101, "step": 28544 }, { "epoch": 0.78, "learning_rate": 2.442346287102545e-06, "loss": 1.2107, "step": 28545 }, { "epoch": 0.78, "learning_rate": 2.441767103761986e-06, "loss": 1.2644, "step": 28546 }, { "epoch": 0.78, "learning_rate": 2.4411879795534845e-06, "loss": 1.2405, "step": 28547 }, { "epoch": 0.78, "learning_rate": 2.440608914481576e-06, "loss": 1.178, "step": 28548 }, { "epoch": 0.78, "learning_rate": 2.4400299085507895e-06, "loss": 1.2715, "step": 28549 }, { "epoch": 0.78, "learning_rate": 2.439450961765654e-06, "loss": 1.2644, "step": 28550 }, { "epoch": 0.78, "learning_rate": 2.438872074130696e-06, "loss": 1.1567, "step": 28551 }, { "epoch": 0.78, "learning_rate": 2.4382932456504493e-06, "loss": 1.2725, "step": 28552 }, { "epoch": 0.78, "learning_rate": 2.437714476329441e-06, "loss": 1.2949, "step": 28553 }, { "epoch": 0.78, "learning_rate": 2.437135766172196e-06, "loss": 1.181, "step": 28554 }, { "epoch": 0.78, "learning_rate": 2.436557115183248e-06, "loss": 1.3401, "step": 28555 }, { "epoch": 0.78, "learning_rate": 2.4359785233671195e-06, "loss": 1.4719, "step": 28556 }, { "epoch": 0.78, "learning_rate": 2.435399990728339e-06, "loss": 1.1692, "step": 28557 }, { "epoch": 0.78, "learning_rate": 2.4348215172714283e-06, "loss": 1.2686, "step": 28558 }, { "epoch": 0.78, "learning_rate": 2.4342431030009196e-06, "loss": 1.27, "step": 28559 }, { "epoch": 0.78, "learning_rate": 2.433664747921335e-06, "loss": 1.3162, "step": 28560 }, { "epoch": 0.78, "learning_rate": 2.4330864520372e-06, "loss": 1.3044, "step": 28561 }, { "epoch": 0.78, "learning_rate": 2.4325082153530355e-06, "loss": 1.2625, "step": 28562 }, { "epoch": 0.78, "learning_rate": 2.43193003787337e-06, "loss": 1.4082, "step": 28563 }, { "epoch": 0.78, "learning_rate": 2.431351919602727e-06, "loss": 1.1208, "step": 28564 }, { "epoch": 0.78, "learning_rate": 2.4307738605456266e-06, "loss": 1.27, "step": 28565 }, { "epoch": 0.78, "learning_rate": 2.430195860706589e-06, "loss": 1.2617, "step": 28566 }, { "epoch": 0.78, "learning_rate": 2.4296179200901427e-06, "loss": 1.1272, "step": 28567 }, { "epoch": 0.78, "learning_rate": 2.429040038700806e-06, "loss": 1.2791, "step": 28568 }, { "epoch": 0.78, "learning_rate": 2.428462216543097e-06, "loss": 1.2915, "step": 28569 }, { "epoch": 0.78, "learning_rate": 2.4278844536215417e-06, "loss": 1.2458, "step": 28570 }, { "epoch": 0.78, "learning_rate": 2.4273067499406553e-06, "loss": 1.2017, "step": 28571 }, { "epoch": 0.78, "learning_rate": 2.426729105504966e-06, "loss": 1.3879, "step": 28572 }, { "epoch": 0.78, "learning_rate": 2.42615152031898e-06, "loss": 1.0674, "step": 28573 }, { "epoch": 0.78, "learning_rate": 2.425573994387227e-06, "loss": 1.2446, "step": 28574 }, { "epoch": 0.78, "learning_rate": 2.4249965277142185e-06, "loss": 1.2439, "step": 28575 }, { "epoch": 0.78, "learning_rate": 2.4244191203044807e-06, "loss": 0.936, "step": 28576 }, { "epoch": 0.78, "learning_rate": 2.4238417721625197e-06, "loss": 1.1921, "step": 28577 }, { "epoch": 0.78, "learning_rate": 2.423264483292861e-06, "loss": 1.1689, "step": 28578 }, { "epoch": 0.78, "learning_rate": 2.4226872537000146e-06, "loss": 1.1592, "step": 28579 }, { "epoch": 0.78, "learning_rate": 2.422110083388506e-06, "loss": 1.1904, "step": 28580 }, { "epoch": 0.78, "learning_rate": 2.42153297236284e-06, "loss": 1.4094, "step": 28581 }, { "epoch": 0.78, "learning_rate": 2.420955920627538e-06, "loss": 1.1677, "step": 28582 }, { "epoch": 0.78, "learning_rate": 2.4203789281871104e-06, "loss": 1.2224, "step": 28583 }, { "epoch": 0.78, "learning_rate": 2.419801995046077e-06, "loss": 1.2275, "step": 28584 }, { "epoch": 0.78, "learning_rate": 2.419225121208949e-06, "loss": 1.2744, "step": 28585 }, { "epoch": 0.78, "learning_rate": 2.4186483066802345e-06, "loss": 1.2979, "step": 28586 }, { "epoch": 0.78, "learning_rate": 2.418071551464455e-06, "loss": 1.155, "step": 28587 }, { "epoch": 0.78, "learning_rate": 2.417494855566118e-06, "loss": 1.2896, "step": 28588 }, { "epoch": 0.78, "learning_rate": 2.4169182189897355e-06, "loss": 1.3188, "step": 28589 }, { "epoch": 0.78, "learning_rate": 2.4163416417398157e-06, "loss": 1.2336, "step": 28590 }, { "epoch": 0.78, "learning_rate": 2.4157651238208766e-06, "loss": 1.2698, "step": 28591 }, { "epoch": 0.78, "learning_rate": 2.4151886652374246e-06, "loss": 1.2324, "step": 28592 }, { "epoch": 0.78, "learning_rate": 2.4146122659939687e-06, "loss": 1.2861, "step": 28593 }, { "epoch": 0.78, "learning_rate": 2.4140359260950174e-06, "loss": 1.3083, "step": 28594 }, { "epoch": 0.78, "learning_rate": 2.4134596455450855e-06, "loss": 1.3857, "step": 28595 }, { "epoch": 0.78, "learning_rate": 2.4128834243486775e-06, "loss": 1.2288, "step": 28596 }, { "epoch": 0.78, "learning_rate": 2.412307262510302e-06, "loss": 1.4316, "step": 28597 }, { "epoch": 0.78, "learning_rate": 2.411731160034463e-06, "loss": 1.2749, "step": 28598 }, { "epoch": 0.78, "learning_rate": 2.411155116925674e-06, "loss": 1.2769, "step": 28599 }, { "epoch": 0.78, "learning_rate": 2.410579133188439e-06, "loss": 1.6602, "step": 28600 }, { "epoch": 0.78, "learning_rate": 2.410003208827262e-06, "loss": 1.7012, "step": 28601 }, { "epoch": 0.78, "learning_rate": 2.409427343846652e-06, "loss": 1.4272, "step": 28602 }, { "epoch": 0.78, "learning_rate": 2.4088515382511145e-06, "loss": 1.165, "step": 28603 }, { "epoch": 0.78, "learning_rate": 2.4082757920451525e-06, "loss": 1.2085, "step": 28604 }, { "epoch": 0.78, "learning_rate": 2.4077001052332683e-06, "loss": 1.2466, "step": 28605 }, { "epoch": 0.78, "learning_rate": 2.407124477819971e-06, "loss": 1.3445, "step": 28606 }, { "epoch": 0.78, "learning_rate": 2.406548909809762e-06, "loss": 1.2754, "step": 28607 }, { "epoch": 0.78, "learning_rate": 2.4059734012071422e-06, "loss": 1.3354, "step": 28608 }, { "epoch": 0.78, "learning_rate": 2.4053979520166138e-06, "loss": 1.1475, "step": 28609 }, { "epoch": 0.78, "learning_rate": 2.4048225622426823e-06, "loss": 1.1929, "step": 28610 }, { "epoch": 0.78, "learning_rate": 2.404247231889849e-06, "loss": 1.7139, "step": 28611 }, { "epoch": 0.78, "learning_rate": 2.4036719609626126e-06, "loss": 1.126, "step": 28612 }, { "epoch": 0.78, "learning_rate": 2.4030967494654724e-06, "loss": 1.1929, "step": 28613 }, { "epoch": 0.78, "learning_rate": 2.4025215974029304e-06, "loss": 1.2694, "step": 28614 }, { "epoch": 0.78, "learning_rate": 2.401946504779493e-06, "loss": 1.3923, "step": 28615 }, { "epoch": 0.78, "learning_rate": 2.401371471599647e-06, "loss": 1.2842, "step": 28616 }, { "epoch": 0.78, "learning_rate": 2.400796497867901e-06, "loss": 1.6865, "step": 28617 }, { "epoch": 0.78, "learning_rate": 2.4002215835887467e-06, "loss": 1.6562, "step": 28618 }, { "epoch": 0.78, "learning_rate": 2.3996467287666914e-06, "loss": 1.3306, "step": 28619 }, { "epoch": 0.78, "learning_rate": 2.3990719334062194e-06, "loss": 1.1943, "step": 28620 }, { "epoch": 0.78, "learning_rate": 2.3984971975118378e-06, "loss": 1.2195, "step": 28621 }, { "epoch": 0.78, "learning_rate": 2.397922521088036e-06, "loss": 1.3716, "step": 28622 }, { "epoch": 0.78, "learning_rate": 2.397347904139321e-06, "loss": 1.7241, "step": 28623 }, { "epoch": 0.78, "learning_rate": 2.396773346670174e-06, "loss": 1.3745, "step": 28624 }, { "epoch": 0.78, "learning_rate": 2.3961988486851007e-06, "loss": 1.125, "step": 28625 }, { "epoch": 0.78, "learning_rate": 2.3956244101885883e-06, "loss": 1.3069, "step": 28626 }, { "epoch": 0.78, "learning_rate": 2.395050031185141e-06, "loss": 1.2825, "step": 28627 }, { "epoch": 0.78, "learning_rate": 2.3944757116792406e-06, "loss": 1.2188, "step": 28628 }, { "epoch": 0.78, "learning_rate": 2.3939014516753876e-06, "loss": 1.2202, "step": 28629 }, { "epoch": 0.78, "learning_rate": 2.3933272511780716e-06, "loss": 1.2878, "step": 28630 }, { "epoch": 0.78, "learning_rate": 2.392753110191788e-06, "loss": 1.3645, "step": 28631 }, { "epoch": 0.78, "learning_rate": 2.392179028721028e-06, "loss": 1.7017, "step": 28632 }, { "epoch": 0.78, "learning_rate": 2.391605006770278e-06, "loss": 1.123, "step": 28633 }, { "epoch": 0.78, "learning_rate": 2.3910310443440356e-06, "loss": 1.29, "step": 28634 }, { "epoch": 0.78, "learning_rate": 2.3904571414467892e-06, "loss": 1.1665, "step": 28635 }, { "epoch": 0.78, "learning_rate": 2.3898832980830265e-06, "loss": 1.3118, "step": 28636 }, { "epoch": 0.78, "learning_rate": 2.3893095142572364e-06, "loss": 1.2974, "step": 28637 }, { "epoch": 0.78, "learning_rate": 2.3887357899739128e-06, "loss": 1.1755, "step": 28638 }, { "epoch": 0.78, "learning_rate": 2.388162125237541e-06, "loss": 1.3215, "step": 28639 }, { "epoch": 0.78, "learning_rate": 2.3875885200526093e-06, "loss": 1.3403, "step": 28640 }, { "epoch": 0.78, "learning_rate": 2.3870149744236025e-06, "loss": 1.2408, "step": 28641 }, { "epoch": 0.78, "learning_rate": 2.3864414883550147e-06, "loss": 1.3499, "step": 28642 }, { "epoch": 0.78, "learning_rate": 2.3858680618513274e-06, "loss": 1.3435, "step": 28643 }, { "epoch": 0.78, "learning_rate": 2.3852946949170274e-06, "loss": 1.1572, "step": 28644 }, { "epoch": 0.78, "learning_rate": 2.3847213875566e-06, "loss": 1.187, "step": 28645 }, { "epoch": 0.78, "learning_rate": 2.3841481397745324e-06, "loss": 1.4612, "step": 28646 }, { "epoch": 0.78, "learning_rate": 2.3835749515753105e-06, "loss": 1.2068, "step": 28647 }, { "epoch": 0.78, "learning_rate": 2.3830018229634122e-06, "loss": 1.1687, "step": 28648 }, { "epoch": 0.78, "learning_rate": 2.382428753943329e-06, "loss": 1.1584, "step": 28649 }, { "epoch": 0.78, "learning_rate": 2.381855744519541e-06, "loss": 1.3516, "step": 28650 }, { "epoch": 0.78, "learning_rate": 2.381282794696532e-06, "loss": 1.1782, "step": 28651 }, { "epoch": 0.78, "learning_rate": 2.380709904478782e-06, "loss": 1.1689, "step": 28652 }, { "epoch": 0.78, "learning_rate": 2.380137073870776e-06, "loss": 1.1474, "step": 28653 }, { "epoch": 0.78, "learning_rate": 2.3795643028769946e-06, "loss": 1.2781, "step": 28654 }, { "epoch": 0.78, "learning_rate": 2.3789915915019192e-06, "loss": 1.4185, "step": 28655 }, { "epoch": 0.78, "learning_rate": 2.3784189397500267e-06, "loss": 1.178, "step": 28656 }, { "epoch": 0.78, "learning_rate": 2.377846347625804e-06, "loss": 1.187, "step": 28657 }, { "epoch": 0.78, "learning_rate": 2.377273815133727e-06, "loss": 1.1635, "step": 28658 }, { "epoch": 0.78, "learning_rate": 2.376701342278275e-06, "loss": 1.2815, "step": 28659 }, { "epoch": 0.78, "learning_rate": 2.3761289290639245e-06, "loss": 1.3315, "step": 28660 }, { "epoch": 0.78, "learning_rate": 2.375556575495156e-06, "loss": 1.2913, "step": 28661 }, { "epoch": 0.78, "learning_rate": 2.37498428157645e-06, "loss": 1.3887, "step": 28662 }, { "epoch": 0.78, "learning_rate": 2.3744120473122823e-06, "loss": 1.28, "step": 28663 }, { "epoch": 0.78, "learning_rate": 2.3738398727071288e-06, "loss": 1.2002, "step": 28664 }, { "epoch": 0.78, "learning_rate": 2.373267757765463e-06, "loss": 1.1362, "step": 28665 }, { "epoch": 0.78, "learning_rate": 2.372695702491766e-06, "loss": 1.2385, "step": 28666 }, { "epoch": 0.78, "learning_rate": 2.3721237068905124e-06, "loss": 1.4048, "step": 28667 }, { "epoch": 0.78, "learning_rate": 2.371551770966175e-06, "loss": 1.2344, "step": 28668 }, { "epoch": 0.78, "learning_rate": 2.3709798947232276e-06, "loss": 1.3269, "step": 28669 }, { "epoch": 0.78, "learning_rate": 2.3704080781661486e-06, "loss": 1.3054, "step": 28670 }, { "epoch": 0.78, "learning_rate": 2.3698363212994093e-06, "loss": 1.2466, "step": 28671 }, { "epoch": 0.78, "learning_rate": 2.3692646241274818e-06, "loss": 1.2473, "step": 28672 }, { "epoch": 0.78, "learning_rate": 2.368692986654837e-06, "loss": 1.3076, "step": 28673 }, { "epoch": 0.78, "learning_rate": 2.368121408885953e-06, "loss": 1.3047, "step": 28674 }, { "epoch": 0.78, "learning_rate": 2.367549890825298e-06, "loss": 1.2043, "step": 28675 }, { "epoch": 0.78, "learning_rate": 2.3669784324773417e-06, "loss": 1.1399, "step": 28676 }, { "epoch": 0.78, "learning_rate": 2.3664070338465585e-06, "loss": 1.2292, "step": 28677 }, { "epoch": 0.78, "learning_rate": 2.3658356949374185e-06, "loss": 1.3049, "step": 28678 }, { "epoch": 0.78, "learning_rate": 2.365264415754389e-06, "loss": 1.1836, "step": 28679 }, { "epoch": 0.78, "learning_rate": 2.3646931963019383e-06, "loss": 1.1366, "step": 28680 }, { "epoch": 0.78, "learning_rate": 2.36412203658454e-06, "loss": 1.2759, "step": 28681 }, { "epoch": 0.78, "learning_rate": 2.36355093660666e-06, "loss": 1.3848, "step": 28682 }, { "epoch": 0.78, "learning_rate": 2.3629798963727678e-06, "loss": 1.2939, "step": 28683 }, { "epoch": 0.78, "learning_rate": 2.3624089158873266e-06, "loss": 1.2244, "step": 28684 }, { "epoch": 0.78, "learning_rate": 2.3618379951548087e-06, "loss": 1.2524, "step": 28685 }, { "epoch": 0.78, "learning_rate": 2.3612671341796787e-06, "loss": 1.3364, "step": 28686 }, { "epoch": 0.78, "learning_rate": 2.3606963329664023e-06, "loss": 1.1973, "step": 28687 }, { "epoch": 0.78, "learning_rate": 2.3601255915194432e-06, "loss": 1.3835, "step": 28688 }, { "epoch": 0.78, "learning_rate": 2.3595549098432726e-06, "loss": 1.2573, "step": 28689 }, { "epoch": 0.78, "learning_rate": 2.358984287942351e-06, "loss": 1.134, "step": 28690 }, { "epoch": 0.78, "learning_rate": 2.3584137258211424e-06, "loss": 1.7144, "step": 28691 }, { "epoch": 0.78, "learning_rate": 2.3578432234841097e-06, "loss": 1.291, "step": 28692 }, { "epoch": 0.78, "learning_rate": 2.357272780935721e-06, "loss": 1.2344, "step": 28693 }, { "epoch": 0.78, "learning_rate": 2.356702398180435e-06, "loss": 1.3494, "step": 28694 }, { "epoch": 0.78, "learning_rate": 2.3561320752227135e-06, "loss": 1.4324, "step": 28695 }, { "epoch": 0.78, "learning_rate": 2.355561812067023e-06, "loss": 1.2078, "step": 28696 }, { "epoch": 0.78, "learning_rate": 2.3549916087178193e-06, "loss": 1.3105, "step": 28697 }, { "epoch": 0.78, "learning_rate": 2.3544214651795715e-06, "loss": 1.3281, "step": 28698 }, { "epoch": 0.78, "learning_rate": 2.35385138145673e-06, "loss": 1.3049, "step": 28699 }, { "epoch": 0.78, "learning_rate": 2.3532813575537618e-06, "loss": 1.2358, "step": 28700 }, { "epoch": 0.78, "learning_rate": 2.352711393475122e-06, "loss": 1.1687, "step": 28701 }, { "epoch": 0.78, "learning_rate": 2.352141489225278e-06, "loss": 1.2097, "step": 28702 }, { "epoch": 0.78, "learning_rate": 2.3515716448086777e-06, "loss": 1.3206, "step": 28703 }, { "epoch": 0.78, "learning_rate": 2.351001860229787e-06, "loss": 1.2974, "step": 28704 }, { "epoch": 0.78, "learning_rate": 2.3504321354930572e-06, "loss": 1.377, "step": 28705 }, { "epoch": 0.78, "learning_rate": 2.349862470602956e-06, "loss": 1.2502, "step": 28706 }, { "epoch": 0.78, "learning_rate": 2.349292865563927e-06, "loss": 1.1565, "step": 28707 }, { "epoch": 0.78, "learning_rate": 2.3487233203804325e-06, "loss": 1.4131, "step": 28708 }, { "epoch": 0.78, "learning_rate": 2.3481538350569335e-06, "loss": 1.1001, "step": 28709 }, { "epoch": 0.78, "learning_rate": 2.3475844095978793e-06, "loss": 1.2124, "step": 28710 }, { "epoch": 0.78, "learning_rate": 2.3470150440077267e-06, "loss": 1.0974, "step": 28711 }, { "epoch": 0.78, "learning_rate": 2.346445738290927e-06, "loss": 1.2161, "step": 28712 }, { "epoch": 0.78, "learning_rate": 2.3458764924519396e-06, "loss": 1.7295, "step": 28713 }, { "epoch": 0.78, "learning_rate": 2.3453073064952147e-06, "loss": 1.2637, "step": 28714 }, { "epoch": 0.78, "learning_rate": 2.344738180425207e-06, "loss": 1.1821, "step": 28715 }, { "epoch": 0.78, "learning_rate": 2.344169114246364e-06, "loss": 1.3328, "step": 28716 }, { "epoch": 0.78, "learning_rate": 2.3436001079631455e-06, "loss": 1.3015, "step": 28717 }, { "epoch": 0.78, "learning_rate": 2.3430311615799996e-06, "loss": 1.3987, "step": 28718 }, { "epoch": 0.78, "learning_rate": 2.342462275101377e-06, "loss": 1.1689, "step": 28719 }, { "epoch": 0.78, "learning_rate": 2.3418934485317257e-06, "loss": 1.3499, "step": 28720 }, { "epoch": 0.78, "learning_rate": 2.341324681875502e-06, "loss": 1.1162, "step": 28721 }, { "epoch": 0.78, "learning_rate": 2.3407559751371534e-06, "loss": 1.2148, "step": 28722 }, { "epoch": 0.78, "learning_rate": 2.340187328321124e-06, "loss": 1.2954, "step": 28723 }, { "epoch": 0.78, "learning_rate": 2.3396187414318717e-06, "loss": 1.2996, "step": 28724 }, { "epoch": 0.78, "learning_rate": 2.3390502144738393e-06, "loss": 1.3525, "step": 28725 }, { "epoch": 0.78, "learning_rate": 2.3384817474514754e-06, "loss": 1.2136, "step": 28726 }, { "epoch": 0.78, "learning_rate": 2.3379133403692244e-06, "loss": 1.1877, "step": 28727 }, { "epoch": 0.78, "learning_rate": 2.3373449932315395e-06, "loss": 1.2666, "step": 28728 }, { "epoch": 0.78, "learning_rate": 2.3367767060428647e-06, "loss": 1.2087, "step": 28729 }, { "epoch": 0.78, "learning_rate": 2.3362084788076457e-06, "loss": 1.2407, "step": 28730 }, { "epoch": 0.78, "learning_rate": 2.335640311530324e-06, "loss": 1.2759, "step": 28731 }, { "epoch": 0.78, "learning_rate": 2.3350722042153516e-06, "loss": 1.175, "step": 28732 }, { "epoch": 0.78, "learning_rate": 2.33450415686717e-06, "loss": 1.3135, "step": 28733 }, { "epoch": 0.78, "learning_rate": 2.333936169490224e-06, "loss": 1.3176, "step": 28734 }, { "epoch": 0.78, "learning_rate": 2.3333682420889526e-06, "loss": 1.3479, "step": 28735 }, { "epoch": 0.78, "learning_rate": 2.332800374667806e-06, "loss": 1.3464, "step": 28736 }, { "epoch": 0.78, "learning_rate": 2.332232567231225e-06, "loss": 1.2478, "step": 28737 }, { "epoch": 0.78, "learning_rate": 2.3316648197836465e-06, "loss": 1.2849, "step": 28738 }, { "epoch": 0.78, "learning_rate": 2.3310971323295206e-06, "loss": 1.2544, "step": 28739 }, { "epoch": 0.78, "learning_rate": 2.330529504873281e-06, "loss": 1.2144, "step": 28740 }, { "epoch": 0.78, "learning_rate": 2.3299619374193783e-06, "loss": 1.3506, "step": 28741 }, { "epoch": 0.78, "learning_rate": 2.3293944299722406e-06, "loss": 1.312, "step": 28742 }, { "epoch": 0.78, "learning_rate": 2.3288269825363174e-06, "loss": 1.3035, "step": 28743 }, { "epoch": 0.78, "learning_rate": 2.3282595951160413e-06, "loss": 1.4075, "step": 28744 }, { "epoch": 0.79, "learning_rate": 2.32769226771586e-06, "loss": 1.0942, "step": 28745 }, { "epoch": 0.79, "learning_rate": 2.3271250003402012e-06, "loss": 1.0786, "step": 28746 }, { "epoch": 0.79, "learning_rate": 2.3265577929935113e-06, "loss": 1.3584, "step": 28747 }, { "epoch": 0.79, "learning_rate": 2.3259906456802218e-06, "loss": 1.1938, "step": 28748 }, { "epoch": 0.79, "learning_rate": 2.325423558404779e-06, "loss": 1.3101, "step": 28749 }, { "epoch": 0.79, "learning_rate": 2.3248565311716075e-06, "loss": 1.2446, "step": 28750 }, { "epoch": 0.79, "learning_rate": 2.3242895639851517e-06, "loss": 1.1558, "step": 28751 }, { "epoch": 0.79, "learning_rate": 2.323722656849843e-06, "loss": 1.2812, "step": 28752 }, { "epoch": 0.79, "learning_rate": 2.3231558097701246e-06, "loss": 1.6582, "step": 28753 }, { "epoch": 0.79, "learning_rate": 2.322589022750419e-06, "loss": 1.46, "step": 28754 }, { "epoch": 0.79, "learning_rate": 2.3220222957951666e-06, "loss": 1.1436, "step": 28755 }, { "epoch": 0.79, "learning_rate": 2.321455628908804e-06, "loss": 1.3132, "step": 28756 }, { "epoch": 0.79, "learning_rate": 2.3208890220957616e-06, "loss": 1.707, "step": 28757 }, { "epoch": 0.79, "learning_rate": 2.3203224753604734e-06, "loss": 1.1309, "step": 28758 }, { "epoch": 0.79, "learning_rate": 2.319755988707367e-06, "loss": 1.1885, "step": 28759 }, { "epoch": 0.79, "learning_rate": 2.319189562140882e-06, "loss": 1.1797, "step": 28760 }, { "epoch": 0.79, "learning_rate": 2.318623195665446e-06, "loss": 1.2256, "step": 28761 }, { "epoch": 0.79, "learning_rate": 2.3180568892854904e-06, "loss": 1.3784, "step": 28762 }, { "epoch": 0.79, "learning_rate": 2.3174906430054412e-06, "loss": 1.3713, "step": 28763 }, { "epoch": 0.79, "learning_rate": 2.3169244568297365e-06, "loss": 1.3813, "step": 28764 }, { "epoch": 0.79, "learning_rate": 2.3163583307628025e-06, "loss": 1.2145, "step": 28765 }, { "epoch": 0.79, "learning_rate": 2.315792264809067e-06, "loss": 1.2507, "step": 28766 }, { "epoch": 0.79, "learning_rate": 2.3152262589729567e-06, "loss": 1.2075, "step": 28767 }, { "epoch": 0.79, "learning_rate": 2.3146603132589053e-06, "loss": 1.2603, "step": 28768 }, { "epoch": 0.79, "learning_rate": 2.314094427671338e-06, "loss": 1.4639, "step": 28769 }, { "epoch": 0.79, "learning_rate": 2.3135286022146785e-06, "loss": 1.1819, "step": 28770 }, { "epoch": 0.79, "learning_rate": 2.3129628368933597e-06, "loss": 1.2397, "step": 28771 }, { "epoch": 0.79, "learning_rate": 2.3123971317118054e-06, "loss": 1.3757, "step": 28772 }, { "epoch": 0.79, "learning_rate": 2.3118314866744408e-06, "loss": 1.1023, "step": 28773 }, { "epoch": 0.79, "learning_rate": 2.3112659017856888e-06, "loss": 1.6836, "step": 28774 }, { "epoch": 0.79, "learning_rate": 2.3107003770499793e-06, "loss": 1.2925, "step": 28775 }, { "epoch": 0.79, "learning_rate": 2.3101349124717344e-06, "loss": 1.3853, "step": 28776 }, { "epoch": 0.79, "learning_rate": 2.309569508055378e-06, "loss": 0.9609, "step": 28777 }, { "epoch": 0.79, "learning_rate": 2.3090041638053308e-06, "loss": 1.1831, "step": 28778 }, { "epoch": 0.79, "learning_rate": 2.3084388797260206e-06, "loss": 1.2097, "step": 28779 }, { "epoch": 0.79, "learning_rate": 2.3078736558218682e-06, "loss": 1.197, "step": 28780 }, { "epoch": 0.79, "learning_rate": 2.3073084920972955e-06, "loss": 1.1467, "step": 28781 }, { "epoch": 0.79, "learning_rate": 2.30674338855672e-06, "loss": 1.261, "step": 28782 }, { "epoch": 0.79, "learning_rate": 2.3061783452045705e-06, "loss": 1.6997, "step": 28783 }, { "epoch": 0.79, "learning_rate": 2.3056133620452637e-06, "loss": 1.2061, "step": 28784 }, { "epoch": 0.79, "learning_rate": 2.3050484390832163e-06, "loss": 1.2104, "step": 28785 }, { "epoch": 0.79, "learning_rate": 2.3044835763228545e-06, "loss": 1.3445, "step": 28786 }, { "epoch": 0.79, "learning_rate": 2.303918773768592e-06, "loss": 1.2383, "step": 28787 }, { "epoch": 0.79, "learning_rate": 2.303354031424856e-06, "loss": 1.217, "step": 28788 }, { "epoch": 0.79, "learning_rate": 2.302789349296053e-06, "loss": 1.6812, "step": 28789 }, { "epoch": 0.79, "learning_rate": 2.3022247273866093e-06, "loss": 1.3013, "step": 28790 }, { "epoch": 0.79, "learning_rate": 2.3016601657009364e-06, "loss": 1.3489, "step": 28791 }, { "epoch": 0.79, "learning_rate": 2.30109566424346e-06, "loss": 1.1013, "step": 28792 }, { "epoch": 0.79, "learning_rate": 2.300531223018586e-06, "loss": 1.3037, "step": 28793 }, { "epoch": 0.79, "learning_rate": 2.2999668420307373e-06, "loss": 1.2844, "step": 28794 }, { "epoch": 0.79, "learning_rate": 2.2994025212843253e-06, "loss": 1.2466, "step": 28795 }, { "epoch": 0.79, "learning_rate": 2.2988382607837712e-06, "loss": 1.3308, "step": 28796 }, { "epoch": 0.79, "learning_rate": 2.298274060533481e-06, "loss": 1.2578, "step": 28797 }, { "epoch": 0.79, "learning_rate": 2.297709920537874e-06, "loss": 1.2737, "step": 28798 }, { "epoch": 0.79, "learning_rate": 2.297145840801361e-06, "loss": 1.4424, "step": 28799 }, { "epoch": 0.79, "learning_rate": 2.2965818213283597e-06, "loss": 1.4795, "step": 28800 }, { "epoch": 0.79, "learning_rate": 2.2960178621232796e-06, "loss": 1.1479, "step": 28801 }, { "epoch": 0.79, "learning_rate": 2.29545396319053e-06, "loss": 1.1782, "step": 28802 }, { "epoch": 0.79, "learning_rate": 2.294890124534529e-06, "loss": 1.354, "step": 28803 }, { "epoch": 0.79, "learning_rate": 2.294326346159684e-06, "loss": 1.2512, "step": 28804 }, { "epoch": 0.79, "learning_rate": 2.293762628070406e-06, "loss": 1.1946, "step": 28805 }, { "epoch": 0.79, "learning_rate": 2.2931989702711033e-06, "loss": 1.1895, "step": 28806 }, { "epoch": 0.79, "learning_rate": 2.292635372766191e-06, "loss": 1.1038, "step": 28807 }, { "epoch": 0.79, "learning_rate": 2.2920718355600748e-06, "loss": 1.2898, "step": 28808 }, { "epoch": 0.79, "learning_rate": 2.291508358657164e-06, "loss": 1.2158, "step": 28809 }, { "epoch": 0.79, "learning_rate": 2.2909449420618636e-06, "loss": 1.291, "step": 28810 }, { "epoch": 0.79, "learning_rate": 2.290381585778588e-06, "loss": 1.2046, "step": 28811 }, { "epoch": 0.79, "learning_rate": 2.289818289811743e-06, "loss": 1.0994, "step": 28812 }, { "epoch": 0.79, "learning_rate": 2.2892550541657322e-06, "loss": 1.2734, "step": 28813 }, { "epoch": 0.79, "learning_rate": 2.2886918788449617e-06, "loss": 1.2527, "step": 28814 }, { "epoch": 0.79, "learning_rate": 2.288128763853844e-06, "loss": 1.4124, "step": 28815 }, { "epoch": 0.79, "learning_rate": 2.2875657091967784e-06, "loss": 1.1584, "step": 28816 }, { "epoch": 0.79, "learning_rate": 2.2870027148781705e-06, "loss": 1.2852, "step": 28817 }, { "epoch": 0.79, "learning_rate": 2.28643978090243e-06, "loss": 1.0121, "step": 28818 }, { "epoch": 0.79, "learning_rate": 2.285876907273956e-06, "loss": 1.3115, "step": 28819 }, { "epoch": 0.79, "learning_rate": 2.285314093997154e-06, "loss": 1.2461, "step": 28820 }, { "epoch": 0.79, "learning_rate": 2.2847513410764245e-06, "loss": 1.2913, "step": 28821 }, { "epoch": 0.79, "learning_rate": 2.2841886485161747e-06, "loss": 1.3413, "step": 28822 }, { "epoch": 0.79, "learning_rate": 2.283626016320805e-06, "loss": 1.281, "step": 28823 }, { "epoch": 0.79, "learning_rate": 2.2830634444947165e-06, "loss": 1.2192, "step": 28824 }, { "epoch": 0.79, "learning_rate": 2.2825009330423085e-06, "loss": 1.3572, "step": 28825 }, { "epoch": 0.79, "learning_rate": 2.281938481967987e-06, "loss": 1.1624, "step": 28826 }, { "epoch": 0.79, "learning_rate": 2.2813760912761498e-06, "loss": 1.3232, "step": 28827 }, { "epoch": 0.79, "learning_rate": 2.2808137609711955e-06, "loss": 1.2478, "step": 28828 }, { "epoch": 0.79, "learning_rate": 2.2802514910575223e-06, "loss": 1.2886, "step": 28829 }, { "epoch": 0.79, "learning_rate": 2.2796892815395345e-06, "loss": 1.1313, "step": 28830 }, { "epoch": 0.79, "learning_rate": 2.279127132421627e-06, "loss": 1.2991, "step": 28831 }, { "epoch": 0.79, "learning_rate": 2.2785650437081954e-06, "loss": 1.2363, "step": 28832 }, { "epoch": 0.79, "learning_rate": 2.2780030154036426e-06, "loss": 1.3831, "step": 28833 }, { "epoch": 0.79, "learning_rate": 2.277441047512361e-06, "loss": 1.2766, "step": 28834 }, { "epoch": 0.79, "learning_rate": 2.2768791400387546e-06, "loss": 1.0237, "step": 28835 }, { "epoch": 0.79, "learning_rate": 2.2763172929872078e-06, "loss": 1.2344, "step": 28836 }, { "epoch": 0.79, "learning_rate": 2.275755506362126e-06, "loss": 1.3157, "step": 28837 }, { "epoch": 0.79, "learning_rate": 2.275193780167898e-06, "loss": 1.1897, "step": 28838 }, { "epoch": 0.79, "learning_rate": 2.2746321144089276e-06, "loss": 1.2637, "step": 28839 }, { "epoch": 0.79, "learning_rate": 2.2740705090895966e-06, "loss": 1.1902, "step": 28840 }, { "epoch": 0.79, "learning_rate": 2.273508964214308e-06, "loss": 1.6577, "step": 28841 }, { "epoch": 0.79, "learning_rate": 2.2729474797874483e-06, "loss": 1.3152, "step": 28842 }, { "epoch": 0.79, "learning_rate": 2.27238605581342e-06, "loss": 1.2659, "step": 28843 }, { "epoch": 0.79, "learning_rate": 2.271824692296605e-06, "loss": 1.228, "step": 28844 }, { "epoch": 0.79, "learning_rate": 2.2712633892414017e-06, "loss": 1.1853, "step": 28845 }, { "epoch": 0.79, "learning_rate": 2.270702146652196e-06, "loss": 1.6797, "step": 28846 }, { "epoch": 0.79, "learning_rate": 2.270140964533385e-06, "loss": 1.2178, "step": 28847 }, { "epoch": 0.79, "learning_rate": 2.269579842889357e-06, "loss": 1.2258, "step": 28848 }, { "epoch": 0.79, "learning_rate": 2.269018781724498e-06, "loss": 1.2754, "step": 28849 }, { "epoch": 0.79, "learning_rate": 2.268457781043203e-06, "loss": 1.3191, "step": 28850 }, { "epoch": 0.79, "learning_rate": 2.267896840849859e-06, "loss": 1.218, "step": 28851 }, { "epoch": 0.79, "learning_rate": 2.2673359611488556e-06, "loss": 1.2512, "step": 28852 }, { "epoch": 0.79, "learning_rate": 2.266775141944575e-06, "loss": 1.2751, "step": 28853 }, { "epoch": 0.79, "learning_rate": 2.2662143832414118e-06, "loss": 1.2468, "step": 28854 }, { "epoch": 0.79, "learning_rate": 2.2656536850437516e-06, "loss": 1.2888, "step": 28855 }, { "epoch": 0.79, "learning_rate": 2.2650930473559796e-06, "loss": 1.1753, "step": 28856 }, { "epoch": 0.79, "learning_rate": 2.26453247018248e-06, "loss": 1.3362, "step": 28857 }, { "epoch": 0.79, "learning_rate": 2.263971953527644e-06, "loss": 1.4087, "step": 28858 }, { "epoch": 0.79, "learning_rate": 2.263411497395853e-06, "loss": 1.3989, "step": 28859 }, { "epoch": 0.79, "learning_rate": 2.262851101791492e-06, "loss": 1.0615, "step": 28860 }, { "epoch": 0.79, "learning_rate": 2.2622907667189443e-06, "loss": 1.1794, "step": 28861 }, { "epoch": 0.79, "learning_rate": 2.2617304921825965e-06, "loss": 1.0212, "step": 28862 }, { "epoch": 0.79, "learning_rate": 2.2611702781868305e-06, "loss": 1.3579, "step": 28863 }, { "epoch": 0.79, "learning_rate": 2.260610124736028e-06, "loss": 1.2405, "step": 28864 }, { "epoch": 0.79, "learning_rate": 2.2600500318345742e-06, "loss": 1.2795, "step": 28865 }, { "epoch": 0.79, "learning_rate": 2.259489999486849e-06, "loss": 1.2761, "step": 28866 }, { "epoch": 0.79, "learning_rate": 2.2589300276972346e-06, "loss": 1.3086, "step": 28867 }, { "epoch": 0.79, "learning_rate": 2.25837011647011e-06, "loss": 1.3098, "step": 28868 }, { "epoch": 0.79, "learning_rate": 2.257810265809859e-06, "loss": 1.261, "step": 28869 }, { "epoch": 0.79, "learning_rate": 2.257250475720859e-06, "loss": 1.176, "step": 28870 }, { "epoch": 0.79, "learning_rate": 2.2566907462074918e-06, "loss": 1.1875, "step": 28871 }, { "epoch": 0.79, "learning_rate": 2.2561310772741306e-06, "loss": 1.604, "step": 28872 }, { "epoch": 0.79, "learning_rate": 2.2555714689251627e-06, "loss": 1.1931, "step": 28873 }, { "epoch": 0.79, "learning_rate": 2.2550119211649613e-06, "loss": 1.2202, "step": 28874 }, { "epoch": 0.79, "learning_rate": 2.2544524339979047e-06, "loss": 1.3032, "step": 28875 }, { "epoch": 0.79, "learning_rate": 2.253893007428368e-06, "loss": 1.0963, "step": 28876 }, { "epoch": 0.79, "learning_rate": 2.253333641460732e-06, "loss": 1.1475, "step": 28877 }, { "epoch": 0.79, "learning_rate": 2.2527743360993713e-06, "loss": 1.3503, "step": 28878 }, { "epoch": 0.79, "learning_rate": 2.2522150913486574e-06, "loss": 1.307, "step": 28879 }, { "epoch": 0.79, "learning_rate": 2.2516559072129727e-06, "loss": 1.3235, "step": 28880 }, { "epoch": 0.79, "learning_rate": 2.251096783696687e-06, "loss": 1.1853, "step": 28881 }, { "epoch": 0.79, "learning_rate": 2.25053772080418e-06, "loss": 1.387, "step": 28882 }, { "epoch": 0.79, "learning_rate": 2.2499787185398168e-06, "loss": 1.2947, "step": 28883 }, { "epoch": 0.79, "learning_rate": 2.2494197769079797e-06, "loss": 1.2393, "step": 28884 }, { "epoch": 0.79, "learning_rate": 2.248860895913034e-06, "loss": 1.1638, "step": 28885 }, { "epoch": 0.79, "learning_rate": 2.248302075559361e-06, "loss": 1.2881, "step": 28886 }, { "epoch": 0.79, "learning_rate": 2.247743315851323e-06, "loss": 1.353, "step": 28887 }, { "epoch": 0.79, "learning_rate": 2.2471846167932975e-06, "loss": 1.2036, "step": 28888 }, { "epoch": 0.79, "learning_rate": 2.2466259783896515e-06, "loss": 1.4358, "step": 28889 }, { "epoch": 0.79, "learning_rate": 2.2460674006447647e-06, "loss": 1.2939, "step": 28890 }, { "epoch": 0.79, "learning_rate": 2.2455088835629936e-06, "loss": 1.3428, "step": 28891 }, { "epoch": 0.79, "learning_rate": 2.2449504271487178e-06, "loss": 1.1855, "step": 28892 }, { "epoch": 0.79, "learning_rate": 2.2443920314062993e-06, "loss": 1.2949, "step": 28893 }, { "epoch": 0.79, "learning_rate": 2.2438336963401153e-06, "loss": 1.395, "step": 28894 }, { "epoch": 0.79, "learning_rate": 2.2432754219545285e-06, "loss": 1.3887, "step": 28895 }, { "epoch": 0.79, "learning_rate": 2.242717208253904e-06, "loss": 1.1807, "step": 28896 }, { "epoch": 0.79, "learning_rate": 2.2421590552426154e-06, "loss": 1.1521, "step": 28897 }, { "epoch": 0.79, "learning_rate": 2.2416009629250258e-06, "loss": 1.26, "step": 28898 }, { "epoch": 0.79, "learning_rate": 2.2410429313055025e-06, "loss": 1.1655, "step": 28899 }, { "epoch": 0.79, "learning_rate": 2.2404849603884083e-06, "loss": 1.2639, "step": 28900 }, { "epoch": 0.79, "learning_rate": 2.2399270501781133e-06, "loss": 1.438, "step": 28901 }, { "epoch": 0.79, "learning_rate": 2.23936920067898e-06, "loss": 1.2263, "step": 28902 }, { "epoch": 0.79, "learning_rate": 2.238811411895374e-06, "loss": 1.3804, "step": 28903 }, { "epoch": 0.79, "learning_rate": 2.238253683831654e-06, "loss": 1.291, "step": 28904 }, { "epoch": 0.79, "learning_rate": 2.2376960164921902e-06, "loss": 1.3965, "step": 28905 }, { "epoch": 0.79, "learning_rate": 2.2371384098813433e-06, "loss": 1.3857, "step": 28906 }, { "epoch": 0.79, "learning_rate": 2.2365808640034736e-06, "loss": 1.3142, "step": 28907 }, { "epoch": 0.79, "learning_rate": 2.2360233788629438e-06, "loss": 1.416, "step": 28908 }, { "epoch": 0.79, "learning_rate": 2.2354659544641177e-06, "loss": 1.2495, "step": 28909 }, { "epoch": 0.79, "learning_rate": 2.2349085908113555e-06, "loss": 1.3516, "step": 28910 }, { "epoch": 0.79, "learning_rate": 2.2343512879090135e-06, "loss": 1.2815, "step": 28911 }, { "epoch": 0.79, "learning_rate": 2.2337940457614593e-06, "loss": 1.2559, "step": 28912 }, { "epoch": 0.79, "learning_rate": 2.2332368643730472e-06, "loss": 1.3599, "step": 28913 }, { "epoch": 0.79, "learning_rate": 2.2326797437481386e-06, "loss": 1.2649, "step": 28914 }, { "epoch": 0.79, "learning_rate": 2.232122683891088e-06, "loss": 1.1904, "step": 28915 }, { "epoch": 0.79, "learning_rate": 2.2315656848062593e-06, "loss": 1.2266, "step": 28916 }, { "epoch": 0.79, "learning_rate": 2.231008746498009e-06, "loss": 1.2935, "step": 28917 }, { "epoch": 0.79, "learning_rate": 2.230451868970692e-06, "loss": 1.2549, "step": 28918 }, { "epoch": 0.79, "learning_rate": 2.229895052228663e-06, "loss": 1.2073, "step": 28919 }, { "epoch": 0.79, "learning_rate": 2.2293382962762856e-06, "loss": 1.3953, "step": 28920 }, { "epoch": 0.79, "learning_rate": 2.2287816011179098e-06, "loss": 1.2886, "step": 28921 }, { "epoch": 0.79, "learning_rate": 2.2282249667578936e-06, "loss": 1.3889, "step": 28922 }, { "epoch": 0.79, "learning_rate": 2.227668393200587e-06, "loss": 1.2742, "step": 28923 }, { "epoch": 0.79, "learning_rate": 2.227111880450351e-06, "loss": 1.281, "step": 28924 }, { "epoch": 0.79, "learning_rate": 2.2265554285115377e-06, "loss": 1.3496, "step": 28925 }, { "epoch": 0.79, "learning_rate": 2.2259990373884956e-06, "loss": 1.1104, "step": 28926 }, { "epoch": 0.79, "learning_rate": 2.2254427070855846e-06, "loss": 1.4121, "step": 28927 }, { "epoch": 0.79, "learning_rate": 2.224886437607151e-06, "loss": 1.3276, "step": 28928 }, { "epoch": 0.79, "learning_rate": 2.224330228957552e-06, "loss": 1.2869, "step": 28929 }, { "epoch": 0.79, "learning_rate": 2.223774081141138e-06, "loss": 1.2368, "step": 28930 }, { "epoch": 0.79, "learning_rate": 2.223217994162259e-06, "loss": 1.3022, "step": 28931 }, { "epoch": 0.79, "learning_rate": 2.2226619680252615e-06, "loss": 1.3223, "step": 28932 }, { "epoch": 0.79, "learning_rate": 2.222106002734503e-06, "loss": 1.3394, "step": 28933 }, { "epoch": 0.79, "learning_rate": 2.2215500982943305e-06, "loss": 1.2266, "step": 28934 }, { "epoch": 0.79, "learning_rate": 2.220994254709091e-06, "loss": 1.2798, "step": 28935 }, { "epoch": 0.79, "learning_rate": 2.2204384719831328e-06, "loss": 1.2803, "step": 28936 }, { "epoch": 0.79, "learning_rate": 2.2198827501208077e-06, "loss": 1.3936, "step": 28937 }, { "epoch": 0.79, "learning_rate": 2.2193270891264616e-06, "loss": 1.231, "step": 28938 }, { "epoch": 0.79, "learning_rate": 2.218771489004442e-06, "loss": 1.2422, "step": 28939 }, { "epoch": 0.79, "learning_rate": 2.2182159497590927e-06, "loss": 1.2905, "step": 28940 }, { "epoch": 0.79, "learning_rate": 2.217660471394766e-06, "loss": 1.0583, "step": 28941 }, { "epoch": 0.79, "learning_rate": 2.217105053915802e-06, "loss": 1.2085, "step": 28942 }, { "epoch": 0.79, "learning_rate": 2.2165496973265478e-06, "loss": 1.1812, "step": 28943 }, { "epoch": 0.79, "learning_rate": 2.2159944016313508e-06, "loss": 1.1912, "step": 28944 }, { "epoch": 0.79, "learning_rate": 2.215439166834552e-06, "loss": 1.0566, "step": 28945 }, { "epoch": 0.79, "learning_rate": 2.2148839929404985e-06, "loss": 1.4028, "step": 28946 }, { "epoch": 0.79, "learning_rate": 2.214328879953528e-06, "loss": 1.1626, "step": 28947 }, { "epoch": 0.79, "learning_rate": 2.2137738278779906e-06, "loss": 1.2615, "step": 28948 }, { "epoch": 0.79, "learning_rate": 2.213218836718225e-06, "loss": 1.0854, "step": 28949 }, { "epoch": 0.79, "learning_rate": 2.2126639064785738e-06, "loss": 1.0662, "step": 28950 }, { "epoch": 0.79, "learning_rate": 2.2121090371633745e-06, "loss": 1.2571, "step": 28951 }, { "epoch": 0.79, "learning_rate": 2.2115542287769767e-06, "loss": 1.2937, "step": 28952 }, { "epoch": 0.79, "learning_rate": 2.2109994813237146e-06, "loss": 1.2595, "step": 28953 }, { "epoch": 0.79, "learning_rate": 2.210444794807931e-06, "loss": 1.2463, "step": 28954 }, { "epoch": 0.79, "learning_rate": 2.2098901692339615e-06, "loss": 1.354, "step": 28955 }, { "epoch": 0.79, "learning_rate": 2.2093356046061496e-06, "loss": 1.3718, "step": 28956 }, { "epoch": 0.79, "learning_rate": 2.208781100928834e-06, "loss": 1.3005, "step": 28957 }, { "epoch": 0.79, "learning_rate": 2.2082266582063485e-06, "loss": 1.0962, "step": 28958 }, { "epoch": 0.79, "learning_rate": 2.2076722764430358e-06, "loss": 1.1838, "step": 28959 }, { "epoch": 0.79, "learning_rate": 2.207117955643229e-06, "loss": 1.3208, "step": 28960 }, { "epoch": 0.79, "learning_rate": 2.206563695811271e-06, "loss": 1.3179, "step": 28961 }, { "epoch": 0.79, "learning_rate": 2.20600949695149e-06, "loss": 1.2229, "step": 28962 }, { "epoch": 0.79, "learning_rate": 2.205455359068227e-06, "loss": 1.1002, "step": 28963 }, { "epoch": 0.79, "learning_rate": 2.2049012821658144e-06, "loss": 1.4341, "step": 28964 }, { "epoch": 0.79, "learning_rate": 2.204347266248593e-06, "loss": 1.1899, "step": 28965 }, { "epoch": 0.79, "learning_rate": 2.2037933113208886e-06, "loss": 1.2634, "step": 28966 }, { "epoch": 0.79, "learning_rate": 2.203239417387042e-06, "loss": 1.4199, "step": 28967 }, { "epoch": 0.79, "learning_rate": 2.202685584451381e-06, "loss": 1.1931, "step": 28968 }, { "epoch": 0.79, "learning_rate": 2.2021318125182455e-06, "loss": 1.2693, "step": 28969 }, { "epoch": 0.79, "learning_rate": 2.2015781015919603e-06, "loss": 1.3608, "step": 28970 }, { "epoch": 0.79, "learning_rate": 2.20102445167686e-06, "loss": 1.2734, "step": 28971 }, { "epoch": 0.79, "learning_rate": 2.2004708627772797e-06, "loss": 1.3542, "step": 28972 }, { "epoch": 0.79, "learning_rate": 2.1999173348975478e-06, "loss": 1.2705, "step": 28973 }, { "epoch": 0.79, "learning_rate": 2.199363868041995e-06, "loss": 1.1633, "step": 28974 }, { "epoch": 0.79, "learning_rate": 2.1988104622149487e-06, "loss": 1.1326, "step": 28975 }, { "epoch": 0.79, "learning_rate": 2.1982571174207433e-06, "loss": 1.2488, "step": 28976 }, { "epoch": 0.79, "learning_rate": 2.1977038336637058e-06, "loss": 1.1274, "step": 28977 }, { "epoch": 0.79, "learning_rate": 2.1971506109481645e-06, "loss": 1.1453, "step": 28978 }, { "epoch": 0.79, "learning_rate": 2.196597449278445e-06, "loss": 1.1421, "step": 28979 }, { "epoch": 0.79, "learning_rate": 2.1960443486588813e-06, "loss": 1.2148, "step": 28980 }, { "epoch": 0.79, "learning_rate": 2.195491309093796e-06, "loss": 1.3291, "step": 28981 }, { "epoch": 0.79, "learning_rate": 2.194938330587516e-06, "loss": 1.3079, "step": 28982 }, { "epoch": 0.79, "learning_rate": 2.1943854131443666e-06, "loss": 1.187, "step": 28983 }, { "epoch": 0.79, "learning_rate": 2.193832556768678e-06, "loss": 1.0999, "step": 28984 }, { "epoch": 0.79, "learning_rate": 2.1932797614647716e-06, "loss": 1.2634, "step": 28985 }, { "epoch": 0.79, "learning_rate": 2.192727027236975e-06, "loss": 1.2117, "step": 28986 }, { "epoch": 0.79, "learning_rate": 2.1921743540896066e-06, "loss": 1.1311, "step": 28987 }, { "epoch": 0.79, "learning_rate": 2.1916217420269994e-06, "loss": 1.1492, "step": 28988 }, { "epoch": 0.79, "learning_rate": 2.19106919105347e-06, "loss": 1.1851, "step": 28989 }, { "epoch": 0.79, "learning_rate": 2.190516701173341e-06, "loss": 1.2148, "step": 28990 }, { "epoch": 0.79, "learning_rate": 2.1899642723909398e-06, "loss": 1.2285, "step": 28991 }, { "epoch": 0.79, "learning_rate": 2.1894119047105854e-06, "loss": 1.4128, "step": 28992 }, { "epoch": 0.79, "learning_rate": 2.1888595981366003e-06, "loss": 1.3379, "step": 28993 }, { "epoch": 0.79, "learning_rate": 2.1883073526733013e-06, "loss": 1.1313, "step": 28994 }, { "epoch": 0.79, "learning_rate": 2.1877551683250155e-06, "loss": 1.2874, "step": 28995 }, { "epoch": 0.79, "learning_rate": 2.187203045096059e-06, "loss": 1.1687, "step": 28996 }, { "epoch": 0.79, "learning_rate": 2.1866509829907524e-06, "loss": 1.2134, "step": 28997 }, { "epoch": 0.79, "learning_rate": 2.1860989820134115e-06, "loss": 1.4282, "step": 28998 }, { "epoch": 0.79, "learning_rate": 2.185547042168361e-06, "loss": 1.3687, "step": 28999 }, { "epoch": 0.79, "learning_rate": 2.1849951634599154e-06, "loss": 1.2776, "step": 29000 }, { "epoch": 0.79, "learning_rate": 2.184443345892393e-06, "loss": 1.0776, "step": 29001 }, { "epoch": 0.79, "learning_rate": 2.1838915894701074e-06, "loss": 1.3533, "step": 29002 }, { "epoch": 0.79, "learning_rate": 2.1833398941973794e-06, "loss": 1.2249, "step": 29003 }, { "epoch": 0.79, "learning_rate": 2.1827882600785287e-06, "loss": 1.3408, "step": 29004 }, { "epoch": 0.79, "learning_rate": 2.1822366871178623e-06, "loss": 1.1018, "step": 29005 }, { "epoch": 0.79, "learning_rate": 2.1816851753197023e-06, "loss": 1.2236, "step": 29006 }, { "epoch": 0.79, "learning_rate": 2.1811337246883592e-06, "loss": 1.3098, "step": 29007 }, { "epoch": 0.79, "learning_rate": 2.180582335228153e-06, "loss": 1.1533, "step": 29008 }, { "epoch": 0.79, "learning_rate": 2.1800310069433896e-06, "loss": 1.2449, "step": 29009 }, { "epoch": 0.79, "learning_rate": 2.179479739838388e-06, "loss": 1.1899, "step": 29010 }, { "epoch": 0.79, "learning_rate": 2.1789285339174583e-06, "loss": 1.2122, "step": 29011 }, { "epoch": 0.79, "learning_rate": 2.178377389184918e-06, "loss": 1.2446, "step": 29012 }, { "epoch": 0.79, "learning_rate": 2.17782630564507e-06, "loss": 1.2722, "step": 29013 }, { "epoch": 0.79, "learning_rate": 2.1772752833022338e-06, "loss": 1.3269, "step": 29014 }, { "epoch": 0.79, "learning_rate": 2.1767243221607137e-06, "loss": 1.1289, "step": 29015 }, { "epoch": 0.79, "learning_rate": 2.17617342222483e-06, "loss": 1.2803, "step": 29016 }, { "epoch": 0.79, "learning_rate": 2.175622583498881e-06, "loss": 1.1995, "step": 29017 }, { "epoch": 0.79, "learning_rate": 2.175071805987181e-06, "loss": 1.2437, "step": 29018 }, { "epoch": 0.79, "learning_rate": 2.1745210896940425e-06, "loss": 1.2683, "step": 29019 }, { "epoch": 0.79, "learning_rate": 2.1739704346237724e-06, "loss": 1.1006, "step": 29020 }, { "epoch": 0.79, "learning_rate": 2.173419840780676e-06, "loss": 1.179, "step": 29021 }, { "epoch": 0.79, "learning_rate": 2.1728693081690598e-06, "loss": 1.2449, "step": 29022 }, { "epoch": 0.79, "learning_rate": 2.172318836793238e-06, "loss": 1.2587, "step": 29023 }, { "epoch": 0.79, "learning_rate": 2.171768426657511e-06, "loss": 1.2913, "step": 29024 }, { "epoch": 0.79, "learning_rate": 2.1712180777661874e-06, "loss": 1.1836, "step": 29025 }, { "epoch": 0.79, "learning_rate": 2.1706677901235695e-06, "loss": 1.3901, "step": 29026 }, { "epoch": 0.79, "learning_rate": 2.1701175637339677e-06, "loss": 1.1272, "step": 29027 }, { "epoch": 0.79, "learning_rate": 2.169567398601684e-06, "loss": 1.2629, "step": 29028 }, { "epoch": 0.79, "learning_rate": 2.169017294731024e-06, "loss": 1.4092, "step": 29029 }, { "epoch": 0.79, "learning_rate": 2.168467252126286e-06, "loss": 1.1941, "step": 29030 }, { "epoch": 0.79, "learning_rate": 2.1679172707917816e-06, "loss": 1.6831, "step": 29031 }, { "epoch": 0.79, "learning_rate": 2.1673673507318095e-06, "loss": 1.3577, "step": 29032 }, { "epoch": 0.79, "learning_rate": 2.166817491950668e-06, "loss": 1.2307, "step": 29033 }, { "epoch": 0.79, "learning_rate": 2.1662676944526674e-06, "loss": 1.334, "step": 29034 }, { "epoch": 0.79, "learning_rate": 2.1657179582421028e-06, "loss": 1.1863, "step": 29035 }, { "epoch": 0.79, "learning_rate": 2.165168283323279e-06, "loss": 1.1792, "step": 29036 }, { "epoch": 0.79, "learning_rate": 2.16461866970049e-06, "loss": 1.0817, "step": 29037 }, { "epoch": 0.79, "learning_rate": 2.1640691173780438e-06, "loss": 1.3049, "step": 29038 }, { "epoch": 0.79, "learning_rate": 2.1635196263602354e-06, "loss": 1.3247, "step": 29039 }, { "epoch": 0.79, "learning_rate": 2.162970196651365e-06, "loss": 1.2297, "step": 29040 }, { "epoch": 0.79, "learning_rate": 2.162420828255728e-06, "loss": 1.259, "step": 29041 }, { "epoch": 0.79, "learning_rate": 2.1618715211776274e-06, "loss": 1.3123, "step": 29042 }, { "epoch": 0.79, "learning_rate": 2.161322275421358e-06, "loss": 1.3088, "step": 29043 }, { "epoch": 0.79, "learning_rate": 2.160773090991217e-06, "loss": 1.3252, "step": 29044 }, { "epoch": 0.79, "learning_rate": 2.1602239678914995e-06, "loss": 1.2869, "step": 29045 }, { "epoch": 0.79, "learning_rate": 2.1596749061265053e-06, "loss": 1.2676, "step": 29046 }, { "epoch": 0.79, "learning_rate": 2.1591259057005276e-06, "loss": 1.1707, "step": 29047 }, { "epoch": 0.79, "learning_rate": 2.1585769666178615e-06, "loss": 1.3008, "step": 29048 }, { "epoch": 0.79, "learning_rate": 2.1580280888828e-06, "loss": 1.3333, "step": 29049 }, { "epoch": 0.79, "learning_rate": 2.1574792724996383e-06, "loss": 1.2361, "step": 29050 }, { "epoch": 0.79, "learning_rate": 2.1569305174726763e-06, "loss": 1.1143, "step": 29051 }, { "epoch": 0.79, "learning_rate": 2.1563818238061975e-06, "loss": 1.321, "step": 29052 }, { "epoch": 0.79, "learning_rate": 2.1558331915045004e-06, "loss": 1.2766, "step": 29053 }, { "epoch": 0.79, "learning_rate": 2.1552846205718748e-06, "loss": 1.2693, "step": 29054 }, { "epoch": 0.79, "learning_rate": 2.1547361110126175e-06, "loss": 1.3906, "step": 29055 }, { "epoch": 0.79, "learning_rate": 2.154187662831011e-06, "loss": 1.2678, "step": 29056 }, { "epoch": 0.79, "learning_rate": 2.153639276031353e-06, "loss": 1.3083, "step": 29057 }, { "epoch": 0.79, "learning_rate": 2.1530909506179298e-06, "loss": 1.3154, "step": 29058 }, { "epoch": 0.79, "learning_rate": 2.1525426865950383e-06, "loss": 1.385, "step": 29059 }, { "epoch": 0.79, "learning_rate": 2.151994483966956e-06, "loss": 1.1423, "step": 29060 }, { "epoch": 0.79, "learning_rate": 2.151446342737983e-06, "loss": 1.2756, "step": 29061 }, { "epoch": 0.79, "learning_rate": 2.1508982629123996e-06, "loss": 1.3035, "step": 29062 }, { "epoch": 0.79, "learning_rate": 2.150350244494502e-06, "loss": 1.3296, "step": 29063 }, { "epoch": 0.79, "learning_rate": 2.1498022874885695e-06, "loss": 1.1846, "step": 29064 }, { "epoch": 0.79, "learning_rate": 2.1492543918988906e-06, "loss": 1.2332, "step": 29065 }, { "epoch": 0.79, "learning_rate": 2.1487065577297572e-06, "loss": 1.3308, "step": 29066 }, { "epoch": 0.79, "learning_rate": 2.1481587849854513e-06, "loss": 1.3792, "step": 29067 }, { "epoch": 0.79, "learning_rate": 2.1476110736702595e-06, "loss": 1.2117, "step": 29068 }, { "epoch": 0.79, "learning_rate": 2.1470634237884625e-06, "loss": 1.1992, "step": 29069 }, { "epoch": 0.79, "learning_rate": 2.146515835344353e-06, "loss": 1.373, "step": 29070 }, { "epoch": 0.79, "learning_rate": 2.145968308342209e-06, "loss": 1.2329, "step": 29071 }, { "epoch": 0.79, "learning_rate": 2.1454208427863166e-06, "loss": 1.1677, "step": 29072 }, { "epoch": 0.79, "learning_rate": 2.1448734386809543e-06, "loss": 1.2402, "step": 29073 }, { "epoch": 0.79, "learning_rate": 2.1443260960304125e-06, "loss": 1.199, "step": 29074 }, { "epoch": 0.79, "learning_rate": 2.143778814838968e-06, "loss": 1.1758, "step": 29075 }, { "epoch": 0.79, "learning_rate": 2.143231595110905e-06, "loss": 1.3203, "step": 29076 }, { "epoch": 0.79, "learning_rate": 2.142684436850501e-06, "loss": 1.4399, "step": 29077 }, { "epoch": 0.79, "learning_rate": 2.1421373400620406e-06, "loss": 1.1201, "step": 29078 }, { "epoch": 0.79, "learning_rate": 2.1415903047498032e-06, "loss": 1.1833, "step": 29079 }, { "epoch": 0.79, "learning_rate": 2.1410433309180657e-06, "loss": 1.0891, "step": 29080 }, { "epoch": 0.79, "learning_rate": 2.140496418571112e-06, "loss": 1.353, "step": 29081 }, { "epoch": 0.79, "learning_rate": 2.139949567713218e-06, "loss": 1.209, "step": 29082 }, { "epoch": 0.79, "learning_rate": 2.139402778348663e-06, "loss": 1.385, "step": 29083 }, { "epoch": 0.79, "learning_rate": 2.138856050481721e-06, "loss": 1.3262, "step": 29084 }, { "epoch": 0.79, "learning_rate": 2.1383093841166768e-06, "loss": 1.3672, "step": 29085 }, { "epoch": 0.79, "learning_rate": 2.137762779257803e-06, "loss": 1.2756, "step": 29086 }, { "epoch": 0.79, "learning_rate": 2.137216235909375e-06, "loss": 1.2893, "step": 29087 }, { "epoch": 0.79, "learning_rate": 2.1366697540756676e-06, "loss": 1.2454, "step": 29088 }, { "epoch": 0.79, "learning_rate": 2.136123333760961e-06, "loss": 1.3496, "step": 29089 }, { "epoch": 0.79, "learning_rate": 2.1355769749695275e-06, "loss": 1.0923, "step": 29090 }, { "epoch": 0.79, "learning_rate": 2.1350306777056416e-06, "loss": 1.1003, "step": 29091 }, { "epoch": 0.79, "learning_rate": 2.1344844419735757e-06, "loss": 1.2808, "step": 29092 }, { "epoch": 0.79, "learning_rate": 2.1339382677776068e-06, "loss": 1.1536, "step": 29093 }, { "epoch": 0.79, "learning_rate": 2.133392155122006e-06, "loss": 1.1721, "step": 29094 }, { "epoch": 0.79, "learning_rate": 2.1328461040110424e-06, "loss": 1.4102, "step": 29095 }, { "epoch": 0.79, "learning_rate": 2.1323001144489953e-06, "loss": 1.3203, "step": 29096 }, { "epoch": 0.79, "learning_rate": 2.1317541864401303e-06, "loss": 1.2236, "step": 29097 }, { "epoch": 0.79, "learning_rate": 2.1312083199887244e-06, "loss": 1.2664, "step": 29098 }, { "epoch": 0.79, "learning_rate": 2.13066251509904e-06, "loss": 1.2373, "step": 29099 }, { "epoch": 0.79, "learning_rate": 2.1301167717753546e-06, "loss": 1.3152, "step": 29100 }, { "epoch": 0.79, "learning_rate": 2.1295710900219312e-06, "loss": 1.1934, "step": 29101 }, { "epoch": 0.79, "learning_rate": 2.129025469843049e-06, "loss": 1.2319, "step": 29102 }, { "epoch": 0.79, "learning_rate": 2.1284799112429643e-06, "loss": 1.4109, "step": 29103 }, { "epoch": 0.79, "learning_rate": 2.1279344142259538e-06, "loss": 1.2073, "step": 29104 }, { "epoch": 0.79, "learning_rate": 2.127388978796281e-06, "loss": 1.3191, "step": 29105 }, { "epoch": 0.79, "learning_rate": 2.12684360495822e-06, "loss": 1.3003, "step": 29106 }, { "epoch": 0.79, "learning_rate": 2.126298292716027e-06, "loss": 1.293, "step": 29107 }, { "epoch": 0.79, "learning_rate": 2.125753042073976e-06, "loss": 1.2019, "step": 29108 }, { "epoch": 0.79, "learning_rate": 2.1252078530363276e-06, "loss": 1.2939, "step": 29109 }, { "epoch": 0.79, "learning_rate": 2.124662725607356e-06, "loss": 1.0789, "step": 29110 }, { "epoch": 0.8, "learning_rate": 2.1241176597913138e-06, "loss": 1.1924, "step": 29111 }, { "epoch": 0.8, "learning_rate": 2.123572655592472e-06, "loss": 1.6733, "step": 29112 }, { "epoch": 0.8, "learning_rate": 2.1230277130150966e-06, "loss": 1.1224, "step": 29113 }, { "epoch": 0.8, "learning_rate": 2.1224828320634483e-06, "loss": 1.3052, "step": 29114 }, { "epoch": 0.8, "learning_rate": 2.121938012741791e-06, "loss": 1.248, "step": 29115 }, { "epoch": 0.8, "learning_rate": 2.1213932550543824e-06, "loss": 1.386, "step": 29116 }, { "epoch": 0.8, "learning_rate": 2.1208485590054906e-06, "loss": 1.2036, "step": 29117 }, { "epoch": 0.8, "learning_rate": 2.1203039245993763e-06, "loss": 1.127, "step": 29118 }, { "epoch": 0.8, "learning_rate": 2.119759351840297e-06, "loss": 1.293, "step": 29119 }, { "epoch": 0.8, "learning_rate": 2.119214840732513e-06, "loss": 1.3318, "step": 29120 }, { "epoch": 0.8, "learning_rate": 2.1186703912802887e-06, "loss": 1.2449, "step": 29121 }, { "epoch": 0.8, "learning_rate": 2.1181260034878813e-06, "loss": 1.1863, "step": 29122 }, { "epoch": 0.8, "learning_rate": 2.1175816773595504e-06, "loss": 1.1934, "step": 29123 }, { "epoch": 0.8, "learning_rate": 2.1170374128995507e-06, "loss": 1.1436, "step": 29124 }, { "epoch": 0.8, "learning_rate": 2.116493210112146e-06, "loss": 1.1958, "step": 29125 }, { "epoch": 0.8, "learning_rate": 2.1159490690015915e-06, "loss": 1.2769, "step": 29126 }, { "epoch": 0.8, "learning_rate": 2.115404989572142e-06, "loss": 1.5535, "step": 29127 }, { "epoch": 0.8, "learning_rate": 2.1148609718280576e-06, "loss": 1.2651, "step": 29128 }, { "epoch": 0.8, "learning_rate": 2.114317015773595e-06, "loss": 1.3457, "step": 29129 }, { "epoch": 0.8, "learning_rate": 2.1137731214130063e-06, "loss": 1.3813, "step": 29130 }, { "epoch": 0.8, "learning_rate": 2.1132292887505456e-06, "loss": 1.1953, "step": 29131 }, { "epoch": 0.8, "learning_rate": 2.1126855177904736e-06, "loss": 1.2732, "step": 29132 }, { "epoch": 0.8, "learning_rate": 2.1121418085370414e-06, "loss": 1.3713, "step": 29133 }, { "epoch": 0.8, "learning_rate": 2.1115981609945026e-06, "loss": 1.3418, "step": 29134 }, { "epoch": 0.8, "learning_rate": 2.1110545751671074e-06, "loss": 1.3721, "step": 29135 }, { "epoch": 0.8, "learning_rate": 2.1105110510591143e-06, "loss": 1.2798, "step": 29136 }, { "epoch": 0.8, "learning_rate": 2.109967588674773e-06, "loss": 1.1892, "step": 29137 }, { "epoch": 0.8, "learning_rate": 2.1094241880183355e-06, "loss": 1.2068, "step": 29138 }, { "epoch": 0.8, "learning_rate": 2.108880849094049e-06, "loss": 1.2957, "step": 29139 }, { "epoch": 0.8, "learning_rate": 2.1083375719061718e-06, "loss": 1.3638, "step": 29140 }, { "epoch": 0.8, "learning_rate": 2.10779435645895e-06, "loss": 1.3245, "step": 29141 }, { "epoch": 0.8, "learning_rate": 2.1072512027566316e-06, "loss": 1.2883, "step": 29142 }, { "epoch": 0.8, "learning_rate": 2.1067081108034705e-06, "loss": 1.218, "step": 29143 }, { "epoch": 0.8, "learning_rate": 2.1061650806037103e-06, "loss": 1.4189, "step": 29144 }, { "epoch": 0.8, "learning_rate": 2.105622112161609e-06, "loss": 1.4714, "step": 29145 }, { "epoch": 0.8, "learning_rate": 2.105079205481403e-06, "loss": 1.1118, "step": 29146 }, { "epoch": 0.8, "learning_rate": 2.104536360567346e-06, "loss": 1.1418, "step": 29147 }, { "epoch": 0.8, "learning_rate": 2.103993577423683e-06, "loss": 1.4036, "step": 29148 }, { "epoch": 0.8, "learning_rate": 2.1034508560546653e-06, "loss": 1.3323, "step": 29149 }, { "epoch": 0.8, "learning_rate": 2.1029081964645305e-06, "loss": 1.3418, "step": 29150 }, { "epoch": 0.8, "learning_rate": 2.1023655986575296e-06, "loss": 1.3201, "step": 29151 }, { "epoch": 0.8, "learning_rate": 2.1018230626379055e-06, "loss": 1.2197, "step": 29152 }, { "epoch": 0.8, "learning_rate": 2.1012805884099085e-06, "loss": 1.4287, "step": 29153 }, { "epoch": 0.8, "learning_rate": 2.1007381759777722e-06, "loss": 1.2905, "step": 29154 }, { "epoch": 0.8, "learning_rate": 2.1001958253457498e-06, "loss": 1.6758, "step": 29155 }, { "epoch": 0.8, "learning_rate": 2.099653536518077e-06, "loss": 1.1582, "step": 29156 }, { "epoch": 0.8, "learning_rate": 2.099111309499002e-06, "loss": 1.2751, "step": 29157 }, { "epoch": 0.8, "learning_rate": 2.098569144292766e-06, "loss": 1.1483, "step": 29158 }, { "epoch": 0.8, "learning_rate": 2.098027040903606e-06, "loss": 1.2386, "step": 29159 }, { "epoch": 0.8, "learning_rate": 2.0974849993357695e-06, "loss": 1.2385, "step": 29160 }, { "epoch": 0.8, "learning_rate": 2.096943019593495e-06, "loss": 1.3015, "step": 29161 }, { "epoch": 0.8, "learning_rate": 2.0964011016810217e-06, "loss": 1.2043, "step": 29162 }, { "epoch": 0.8, "learning_rate": 2.095859245602586e-06, "loss": 1.0798, "step": 29163 }, { "epoch": 0.8, "learning_rate": 2.0953174513624343e-06, "loss": 1.3218, "step": 29164 }, { "epoch": 0.8, "learning_rate": 2.0947757189648023e-06, "loss": 1.2419, "step": 29165 }, { "epoch": 0.8, "learning_rate": 2.094234048413927e-06, "loss": 1.2888, "step": 29166 }, { "epoch": 0.8, "learning_rate": 2.0936924397140447e-06, "loss": 1.1968, "step": 29167 }, { "epoch": 0.8, "learning_rate": 2.0931508928693966e-06, "loss": 1.0486, "step": 29168 }, { "epoch": 0.8, "learning_rate": 2.09260940788422e-06, "loss": 1.3618, "step": 29169 }, { "epoch": 0.8, "learning_rate": 2.0920679847627466e-06, "loss": 1.2251, "step": 29170 }, { "epoch": 0.8, "learning_rate": 2.0915266235092137e-06, "loss": 1.6226, "step": 29171 }, { "epoch": 0.8, "learning_rate": 2.0909853241278597e-06, "loss": 1.3145, "step": 29172 }, { "epoch": 0.8, "learning_rate": 2.090444086622918e-06, "loss": 1.3137, "step": 29173 }, { "epoch": 0.8, "learning_rate": 2.089902910998619e-06, "loss": 1.2593, "step": 29174 }, { "epoch": 0.8, "learning_rate": 2.0893617972592027e-06, "loss": 1.3206, "step": 29175 }, { "epoch": 0.8, "learning_rate": 2.0888207454089005e-06, "loss": 1.3306, "step": 29176 }, { "epoch": 0.8, "learning_rate": 2.088279755451944e-06, "loss": 1.3457, "step": 29177 }, { "epoch": 0.8, "learning_rate": 2.087738827392565e-06, "loss": 1.1677, "step": 29178 }, { "epoch": 0.8, "learning_rate": 2.087197961234998e-06, "loss": 1.2605, "step": 29179 }, { "epoch": 0.8, "learning_rate": 2.0866571569834737e-06, "loss": 1.3425, "step": 29180 }, { "epoch": 0.8, "learning_rate": 2.086116414642223e-06, "loss": 1.1455, "step": 29181 }, { "epoch": 0.8, "learning_rate": 2.0855757342154736e-06, "loss": 1.157, "step": 29182 }, { "epoch": 0.8, "learning_rate": 2.08503511570746e-06, "loss": 1.6675, "step": 29183 }, { "epoch": 0.8, "learning_rate": 2.0844945591224098e-06, "loss": 1.2622, "step": 29184 }, { "epoch": 0.8, "learning_rate": 2.0839540644645528e-06, "loss": 0.84, "step": 29185 }, { "epoch": 0.8, "learning_rate": 2.0834136317381137e-06, "loss": 1.165, "step": 29186 }, { "epoch": 0.8, "learning_rate": 2.0828732609473267e-06, "loss": 1.158, "step": 29187 }, { "epoch": 0.8, "learning_rate": 2.0823329520964153e-06, "loss": 1.3625, "step": 29188 }, { "epoch": 0.8, "learning_rate": 2.081792705189606e-06, "loss": 1.2634, "step": 29189 }, { "epoch": 0.8, "learning_rate": 2.0812525202311295e-06, "loss": 1.321, "step": 29190 }, { "epoch": 0.8, "learning_rate": 2.0807123972252077e-06, "loss": 1.2202, "step": 29191 }, { "epoch": 0.8, "learning_rate": 2.0801723361760706e-06, "loss": 1.3018, "step": 29192 }, { "epoch": 0.8, "learning_rate": 2.07963233708794e-06, "loss": 1.2019, "step": 29193 }, { "epoch": 0.8, "learning_rate": 2.0790923999650426e-06, "loss": 1.0908, "step": 29194 }, { "epoch": 0.8, "learning_rate": 2.078552524811599e-06, "loss": 1.2959, "step": 29195 }, { "epoch": 0.8, "learning_rate": 2.0780127116318373e-06, "loss": 1.2998, "step": 29196 }, { "epoch": 0.8, "learning_rate": 2.077472960429979e-06, "loss": 1.3726, "step": 29197 }, { "epoch": 0.8, "learning_rate": 2.0769332712102476e-06, "loss": 1.2358, "step": 29198 }, { "epoch": 0.8, "learning_rate": 2.0763936439768616e-06, "loss": 1.2385, "step": 29199 }, { "epoch": 0.8, "learning_rate": 2.0758540787340485e-06, "loss": 1.1118, "step": 29200 }, { "epoch": 0.8, "learning_rate": 2.075314575486027e-06, "loss": 1.293, "step": 29201 }, { "epoch": 0.8, "learning_rate": 2.0747751342370183e-06, "loss": 1.2295, "step": 29202 }, { "epoch": 0.8, "learning_rate": 2.0742357549912385e-06, "loss": 1.3281, "step": 29203 }, { "epoch": 0.8, "learning_rate": 2.0736964377529147e-06, "loss": 1.313, "step": 29204 }, { "epoch": 0.8, "learning_rate": 2.073157182526262e-06, "loss": 1.2939, "step": 29205 }, { "epoch": 0.8, "learning_rate": 2.0726179893154975e-06, "loss": 1.217, "step": 29206 }, { "epoch": 0.8, "learning_rate": 2.0720788581248452e-06, "loss": 1.2812, "step": 29207 }, { "epoch": 0.8, "learning_rate": 2.0715397889585197e-06, "loss": 1.4016, "step": 29208 }, { "epoch": 0.8, "learning_rate": 2.071000781820739e-06, "loss": 1.2314, "step": 29209 }, { "epoch": 0.8, "learning_rate": 2.070461836715717e-06, "loss": 1.2639, "step": 29210 }, { "epoch": 0.8, "learning_rate": 2.069922953647675e-06, "loss": 1.1486, "step": 29211 }, { "epoch": 0.8, "learning_rate": 2.0693841326208274e-06, "loss": 1.228, "step": 29212 }, { "epoch": 0.8, "learning_rate": 2.068845373639389e-06, "loss": 1.3015, "step": 29213 }, { "epoch": 0.8, "learning_rate": 2.068306676707572e-06, "loss": 1.259, "step": 29214 }, { "epoch": 0.8, "learning_rate": 2.0677680418295963e-06, "loss": 1.4482, "step": 29215 }, { "epoch": 0.8, "learning_rate": 2.067229469009674e-06, "loss": 1.3364, "step": 29216 }, { "epoch": 0.8, "learning_rate": 2.0666909582520178e-06, "loss": 1.1475, "step": 29217 }, { "epoch": 0.8, "learning_rate": 2.066152509560838e-06, "loss": 1.2668, "step": 29218 }, { "epoch": 0.8, "learning_rate": 2.0656141229403535e-06, "loss": 1.24, "step": 29219 }, { "epoch": 0.8, "learning_rate": 2.0650757983947733e-06, "loss": 1.2024, "step": 29220 }, { "epoch": 0.8, "learning_rate": 2.0645375359283047e-06, "loss": 1.3672, "step": 29221 }, { "epoch": 0.8, "learning_rate": 2.0639993355451672e-06, "loss": 1.3501, "step": 29222 }, { "epoch": 0.8, "learning_rate": 2.0634611972495634e-06, "loss": 1.2451, "step": 29223 }, { "epoch": 0.8, "learning_rate": 2.0629231210457136e-06, "loss": 1.1953, "step": 29224 }, { "epoch": 0.8, "learning_rate": 2.062385106937814e-06, "loss": 1.3174, "step": 29225 }, { "epoch": 0.8, "learning_rate": 2.0618471549300846e-06, "loss": 1.3313, "step": 29226 }, { "epoch": 0.8, "learning_rate": 2.0613092650267274e-06, "loss": 1.311, "step": 29227 }, { "epoch": 0.8, "learning_rate": 2.06077143723196e-06, "loss": 1.394, "step": 29228 }, { "epoch": 0.8, "learning_rate": 2.060233671549976e-06, "loss": 1.3562, "step": 29229 }, { "epoch": 0.8, "learning_rate": 2.059695967984995e-06, "loss": 1.291, "step": 29230 }, { "epoch": 0.8, "learning_rate": 2.059158326541215e-06, "loss": 1.3899, "step": 29231 }, { "epoch": 0.8, "learning_rate": 2.0586207472228515e-06, "loss": 1.3252, "step": 29232 }, { "epoch": 0.8, "learning_rate": 2.0580832300341005e-06, "loss": 1.1472, "step": 29233 }, { "epoch": 0.8, "learning_rate": 2.057545774979174e-06, "loss": 1.2493, "step": 29234 }, { "epoch": 0.8, "learning_rate": 2.057008382062271e-06, "loss": 1.2644, "step": 29235 }, { "epoch": 0.8, "learning_rate": 2.056471051287603e-06, "loss": 1.0107, "step": 29236 }, { "epoch": 0.8, "learning_rate": 2.0559337826593707e-06, "loss": 1.2031, "step": 29237 }, { "epoch": 0.8, "learning_rate": 2.055396576181773e-06, "loss": 1.1382, "step": 29238 }, { "epoch": 0.8, "learning_rate": 2.0548594318590196e-06, "loss": 1.3079, "step": 29239 }, { "epoch": 0.8, "learning_rate": 2.0543223496953103e-06, "loss": 1.0591, "step": 29240 }, { "epoch": 0.8, "learning_rate": 2.0537853296948463e-06, "loss": 1.2874, "step": 29241 }, { "epoch": 0.8, "learning_rate": 2.0532483718618267e-06, "loss": 1.3533, "step": 29242 }, { "epoch": 0.8, "learning_rate": 2.0527114762004584e-06, "loss": 1.1106, "step": 29243 }, { "epoch": 0.8, "learning_rate": 2.052174642714938e-06, "loss": 1.3938, "step": 29244 }, { "epoch": 0.8, "learning_rate": 2.0516378714094653e-06, "loss": 1.2754, "step": 29245 }, { "epoch": 0.8, "learning_rate": 2.051101162288238e-06, "loss": 1.1775, "step": 29246 }, { "epoch": 0.8, "learning_rate": 2.050564515355461e-06, "loss": 1.2983, "step": 29247 }, { "epoch": 0.8, "learning_rate": 2.050027930615328e-06, "loss": 1.1992, "step": 29248 }, { "epoch": 0.8, "learning_rate": 2.0494914080720387e-06, "loss": 1.2839, "step": 29249 }, { "epoch": 0.8, "learning_rate": 2.0489549477297866e-06, "loss": 1.3318, "step": 29250 }, { "epoch": 0.8, "learning_rate": 2.0484185495927757e-06, "loss": 1.114, "step": 29251 }, { "epoch": 0.8, "learning_rate": 2.0478822136651988e-06, "loss": 1.345, "step": 29252 }, { "epoch": 0.8, "learning_rate": 2.0473459399512487e-06, "loss": 1.0546, "step": 29253 }, { "epoch": 0.8, "learning_rate": 2.046809728455128e-06, "loss": 1.2803, "step": 29254 }, { "epoch": 0.8, "learning_rate": 2.0462735791810272e-06, "loss": 1.1904, "step": 29255 }, { "epoch": 0.8, "learning_rate": 2.045737492133142e-06, "loss": 1.387, "step": 29256 }, { "epoch": 0.8, "learning_rate": 2.045201467315664e-06, "loss": 1.281, "step": 29257 }, { "epoch": 0.8, "learning_rate": 2.0446655047327922e-06, "loss": 1.1687, "step": 29258 }, { "epoch": 0.8, "learning_rate": 2.044129604388716e-06, "loss": 1.3354, "step": 29259 }, { "epoch": 0.8, "learning_rate": 2.0435937662876294e-06, "loss": 1.4312, "step": 29260 }, { "epoch": 0.8, "learning_rate": 2.04305799043372e-06, "loss": 1.3562, "step": 29261 }, { "epoch": 0.8, "learning_rate": 2.042522276831186e-06, "loss": 1.1807, "step": 29262 }, { "epoch": 0.8, "learning_rate": 2.0419866254842167e-06, "loss": 1.2053, "step": 29263 }, { "epoch": 0.8, "learning_rate": 2.041451036397002e-06, "loss": 1.2476, "step": 29264 }, { "epoch": 0.8, "learning_rate": 2.040915509573729e-06, "loss": 1.2571, "step": 29265 }, { "epoch": 0.8, "learning_rate": 2.0403800450185897e-06, "loss": 1.3201, "step": 29266 }, { "epoch": 0.8, "learning_rate": 2.0398446427357797e-06, "loss": 1.1536, "step": 29267 }, { "epoch": 0.8, "learning_rate": 2.0393093027294777e-06, "loss": 1.1519, "step": 29268 }, { "epoch": 0.8, "learning_rate": 2.0387740250038777e-06, "loss": 1.0923, "step": 29269 }, { "epoch": 0.8, "learning_rate": 2.0382388095631646e-06, "loss": 1.3901, "step": 29270 }, { "epoch": 0.8, "learning_rate": 2.0377036564115315e-06, "loss": 1.3948, "step": 29271 }, { "epoch": 0.8, "learning_rate": 2.037168565553156e-06, "loss": 1.3821, "step": 29272 }, { "epoch": 0.8, "learning_rate": 2.036633536992232e-06, "loss": 1.3005, "step": 29273 }, { "epoch": 0.8, "learning_rate": 2.0360985707329393e-06, "loss": 1.2146, "step": 29274 }, { "epoch": 0.8, "learning_rate": 2.0355636667794733e-06, "loss": 1.22, "step": 29275 }, { "epoch": 0.8, "learning_rate": 2.035028825136005e-06, "loss": 1.2993, "step": 29276 }, { "epoch": 0.8, "learning_rate": 2.03449404580673e-06, "loss": 1.2163, "step": 29277 }, { "epoch": 0.8, "learning_rate": 2.0339593287958236e-06, "loss": 1.3005, "step": 29278 }, { "epoch": 0.8, "learning_rate": 2.0334246741074802e-06, "loss": 1.1423, "step": 29279 }, { "epoch": 0.8, "learning_rate": 2.032890081745871e-06, "loss": 1.248, "step": 29280 }, { "epoch": 0.8, "learning_rate": 2.0323555517151817e-06, "loss": 1.2913, "step": 29281 }, { "epoch": 0.8, "learning_rate": 2.0318210840195995e-06, "loss": 1.0024, "step": 29282 }, { "epoch": 0.8, "learning_rate": 2.0312866786633023e-06, "loss": 1.2654, "step": 29283 }, { "epoch": 0.8, "learning_rate": 2.030752335650471e-06, "loss": 1.4927, "step": 29284 }, { "epoch": 0.8, "learning_rate": 2.0302180549852837e-06, "loss": 1.2983, "step": 29285 }, { "epoch": 0.8, "learning_rate": 2.029683836671924e-06, "loss": 1.22, "step": 29286 }, { "epoch": 0.8, "learning_rate": 2.029149680714572e-06, "loss": 1.3137, "step": 29287 }, { "epoch": 0.8, "learning_rate": 2.028615587117403e-06, "loss": 1.2957, "step": 29288 }, { "epoch": 0.8, "learning_rate": 2.0280815558845957e-06, "loss": 1.249, "step": 29289 }, { "epoch": 0.8, "learning_rate": 2.027547587020332e-06, "loss": 1.3953, "step": 29290 }, { "epoch": 0.8, "learning_rate": 2.0270136805287865e-06, "loss": 1.2524, "step": 29291 }, { "epoch": 0.8, "learning_rate": 2.026479836414137e-06, "loss": 1.3582, "step": 29292 }, { "epoch": 0.8, "learning_rate": 2.0259460546805574e-06, "loss": 1.4011, "step": 29293 }, { "epoch": 0.8, "learning_rate": 2.0254123353322284e-06, "loss": 1.2458, "step": 29294 }, { "epoch": 0.8, "learning_rate": 2.0248786783733245e-06, "loss": 1.3589, "step": 29295 }, { "epoch": 0.8, "learning_rate": 2.024345083808019e-06, "loss": 1.1748, "step": 29296 }, { "epoch": 0.8, "learning_rate": 2.0238115516404845e-06, "loss": 1.2605, "step": 29297 }, { "epoch": 0.8, "learning_rate": 2.023278081874901e-06, "loss": 1.2761, "step": 29298 }, { "epoch": 0.8, "learning_rate": 2.022744674515438e-06, "loss": 1.2764, "step": 29299 }, { "epoch": 0.8, "learning_rate": 2.022211329566267e-06, "loss": 1.311, "step": 29300 }, { "epoch": 0.8, "learning_rate": 2.0216780470315657e-06, "loss": 1.2566, "step": 29301 }, { "epoch": 0.8, "learning_rate": 2.0211448269155043e-06, "loss": 1.2271, "step": 29302 }, { "epoch": 0.8, "learning_rate": 2.0206116692222535e-06, "loss": 1.1689, "step": 29303 }, { "epoch": 0.8, "learning_rate": 2.0200785739559813e-06, "loss": 1.1846, "step": 29304 }, { "epoch": 0.8, "learning_rate": 2.0195455411208663e-06, "loss": 1.3213, "step": 29305 }, { "epoch": 0.8, "learning_rate": 2.019012570721073e-06, "loss": 1.2751, "step": 29306 }, { "epoch": 0.8, "learning_rate": 2.0184796627607728e-06, "loss": 1.3389, "step": 29307 }, { "epoch": 0.8, "learning_rate": 2.017946817244132e-06, "loss": 1.3469, "step": 29308 }, { "epoch": 0.8, "learning_rate": 2.0174140341753246e-06, "loss": 1.2749, "step": 29309 }, { "epoch": 0.8, "learning_rate": 2.016881313558516e-06, "loss": 1.3765, "step": 29310 }, { "epoch": 0.8, "learning_rate": 2.016348655397874e-06, "loss": 1.3882, "step": 29311 }, { "epoch": 0.8, "learning_rate": 2.0158160596975627e-06, "loss": 1.6694, "step": 29312 }, { "epoch": 0.8, "learning_rate": 2.015283526461753e-06, "loss": 1.322, "step": 29313 }, { "epoch": 0.8, "learning_rate": 2.014751055694616e-06, "loss": 1.3123, "step": 29314 }, { "epoch": 0.8, "learning_rate": 2.0142186474003058e-06, "loss": 1.2146, "step": 29315 }, { "epoch": 0.8, "learning_rate": 2.0136863015829967e-06, "loss": 1.1851, "step": 29316 }, { "epoch": 0.8, "learning_rate": 2.0131540182468478e-06, "loss": 1.2925, "step": 29317 }, { "epoch": 0.8, "learning_rate": 2.0126217973960305e-06, "loss": 1.2812, "step": 29318 }, { "epoch": 0.8, "learning_rate": 2.0120896390347e-06, "loss": 1.3257, "step": 29319 }, { "epoch": 0.8, "learning_rate": 2.0115575431670266e-06, "loss": 1.2368, "step": 29320 }, { "epoch": 0.8, "learning_rate": 2.0110255097971677e-06, "loss": 1.4297, "step": 29321 }, { "epoch": 0.8, "learning_rate": 2.0104935389292944e-06, "loss": 1.2261, "step": 29322 }, { "epoch": 0.8, "learning_rate": 2.009961630567557e-06, "loss": 1.3433, "step": 29323 }, { "epoch": 0.8, "learning_rate": 2.0094297847161247e-06, "loss": 1.2283, "step": 29324 }, { "epoch": 0.8, "learning_rate": 2.0088980013791546e-06, "loss": 1.3257, "step": 29325 }, { "epoch": 0.8, "learning_rate": 2.008366280560814e-06, "loss": 1.2678, "step": 29326 }, { "epoch": 0.8, "learning_rate": 2.0078346222652523e-06, "loss": 1.4026, "step": 29327 }, { "epoch": 0.8, "learning_rate": 2.007303026496634e-06, "loss": 1.3999, "step": 29328 }, { "epoch": 0.8, "learning_rate": 2.0067714932591208e-06, "loss": 1.2903, "step": 29329 }, { "epoch": 0.8, "learning_rate": 2.00624002255687e-06, "loss": 1.2107, "step": 29330 }, { "epoch": 0.8, "learning_rate": 2.0057086143940374e-06, "loss": 1.248, "step": 29331 }, { "epoch": 0.8, "learning_rate": 2.0051772687747785e-06, "loss": 1.208, "step": 29332 }, { "epoch": 0.8, "learning_rate": 2.0046459857032564e-06, "loss": 1.2849, "step": 29333 }, { "epoch": 0.8, "learning_rate": 2.0041147651836246e-06, "loss": 1.2139, "step": 29334 }, { "epoch": 0.8, "learning_rate": 2.003583607220039e-06, "loss": 1.2593, "step": 29335 }, { "epoch": 0.8, "learning_rate": 2.003052511816651e-06, "loss": 1.3494, "step": 29336 }, { "epoch": 0.8, "learning_rate": 2.002521478977624e-06, "loss": 1.324, "step": 29337 }, { "epoch": 0.8, "learning_rate": 2.0019905087071077e-06, "loss": 1.2219, "step": 29338 }, { "epoch": 0.8, "learning_rate": 2.001459601009257e-06, "loss": 1.0415, "step": 29339 }, { "epoch": 0.8, "learning_rate": 2.0009287558882216e-06, "loss": 1.311, "step": 29340 }, { "epoch": 0.8, "learning_rate": 2.0003979733481616e-06, "loss": 1.228, "step": 29341 }, { "epoch": 0.8, "learning_rate": 1.9998672533932264e-06, "loss": 1.1536, "step": 29342 }, { "epoch": 0.8, "learning_rate": 1.9993365960275644e-06, "loss": 1.2104, "step": 29343 }, { "epoch": 0.8, "learning_rate": 1.9988060012553346e-06, "loss": 1.1658, "step": 29344 }, { "epoch": 0.8, "learning_rate": 1.998275469080684e-06, "loss": 1.333, "step": 29345 }, { "epoch": 0.8, "learning_rate": 1.9977449995077626e-06, "loss": 1.2212, "step": 29346 }, { "epoch": 0.8, "learning_rate": 1.9972145925407193e-06, "loss": 1.1055, "step": 29347 }, { "epoch": 0.8, "learning_rate": 1.996684248183708e-06, "loss": 1.3882, "step": 29348 }, { "epoch": 0.8, "learning_rate": 1.9961539664408757e-06, "loss": 1.1021, "step": 29349 }, { "epoch": 0.8, "learning_rate": 1.995623747316372e-06, "loss": 1.2244, "step": 29350 }, { "epoch": 0.8, "learning_rate": 1.995093590814341e-06, "loss": 1.144, "step": 29351 }, { "epoch": 0.8, "learning_rate": 1.994563496938936e-06, "loss": 1.1362, "step": 29352 }, { "epoch": 0.8, "learning_rate": 1.9940334656943015e-06, "loss": 1.2319, "step": 29353 }, { "epoch": 0.8, "learning_rate": 1.9935034970845855e-06, "loss": 1.1431, "step": 29354 }, { "epoch": 0.8, "learning_rate": 1.9929735911139304e-06, "loss": 1.1904, "step": 29355 }, { "epoch": 0.8, "learning_rate": 1.9924437477864868e-06, "loss": 1.1104, "step": 29356 }, { "epoch": 0.8, "learning_rate": 1.9919139671063982e-06, "loss": 1.4277, "step": 29357 }, { "epoch": 0.8, "learning_rate": 1.991384249077809e-06, "loss": 1.3296, "step": 29358 }, { "epoch": 0.8, "learning_rate": 1.990854593704861e-06, "loss": 1.3718, "step": 29359 }, { "epoch": 0.8, "learning_rate": 1.9903250009916997e-06, "loss": 1.323, "step": 29360 }, { "epoch": 0.8, "learning_rate": 1.989795470942475e-06, "loss": 1.4385, "step": 29361 }, { "epoch": 0.8, "learning_rate": 1.9892660035613188e-06, "loss": 1.2678, "step": 29362 }, { "epoch": 0.8, "learning_rate": 1.9887365988523812e-06, "loss": 1.2202, "step": 29363 }, { "epoch": 0.8, "learning_rate": 1.9882072568197987e-06, "loss": 1.1675, "step": 29364 }, { "epoch": 0.8, "learning_rate": 1.9876779774677203e-06, "loss": 1.1509, "step": 29365 }, { "epoch": 0.8, "learning_rate": 1.987148760800276e-06, "loss": 1.1221, "step": 29366 }, { "epoch": 0.8, "learning_rate": 1.9866196068216147e-06, "loss": 1.2439, "step": 29367 }, { "epoch": 0.8, "learning_rate": 1.986090515535871e-06, "loss": 1.2273, "step": 29368 }, { "epoch": 0.8, "learning_rate": 1.985561486947193e-06, "loss": 1.2903, "step": 29369 }, { "epoch": 0.8, "learning_rate": 1.9850325210597067e-06, "loss": 1.2869, "step": 29370 }, { "epoch": 0.8, "learning_rate": 1.98450361787756e-06, "loss": 1.3413, "step": 29371 }, { "epoch": 0.8, "learning_rate": 1.983974777404886e-06, "loss": 1.3469, "step": 29372 }, { "epoch": 0.8, "learning_rate": 1.983445999645828e-06, "loss": 1.2456, "step": 29373 }, { "epoch": 0.8, "learning_rate": 1.982917284604514e-06, "loss": 1.3611, "step": 29374 }, { "epoch": 0.8, "learning_rate": 1.9823886322850847e-06, "loss": 1.2144, "step": 29375 }, { "epoch": 0.8, "learning_rate": 1.98186004269168e-06, "loss": 1.1111, "step": 29376 }, { "epoch": 0.8, "learning_rate": 1.9813315158284317e-06, "loss": 1.2839, "step": 29377 }, { "epoch": 0.8, "learning_rate": 1.980803051699476e-06, "loss": 1.2498, "step": 29378 }, { "epoch": 0.8, "learning_rate": 1.980274650308942e-06, "loss": 1.1375, "step": 29379 }, { "epoch": 0.8, "learning_rate": 1.979746311660972e-06, "loss": 1.291, "step": 29380 }, { "epoch": 0.8, "learning_rate": 1.9792180357596945e-06, "loss": 1.1547, "step": 29381 }, { "epoch": 0.8, "learning_rate": 1.978689822609243e-06, "loss": 1.1973, "step": 29382 }, { "epoch": 0.8, "learning_rate": 1.97816167221375e-06, "loss": 1.7441, "step": 29383 }, { "epoch": 0.8, "learning_rate": 1.977633584577349e-06, "loss": 1.3167, "step": 29384 }, { "epoch": 0.8, "learning_rate": 1.97710555970417e-06, "loss": 1.2139, "step": 29385 }, { "epoch": 0.8, "learning_rate": 1.9765775975983447e-06, "loss": 1.283, "step": 29386 }, { "epoch": 0.8, "learning_rate": 1.9760496982640023e-06, "loss": 1.2332, "step": 29387 }, { "epoch": 0.8, "learning_rate": 1.975521861705275e-06, "loss": 1.2722, "step": 29388 }, { "epoch": 0.8, "learning_rate": 1.974994087926292e-06, "loss": 1.1804, "step": 29389 }, { "epoch": 0.8, "learning_rate": 1.974466376931178e-06, "loss": 1.1746, "step": 29390 }, { "epoch": 0.8, "learning_rate": 1.9739387287240685e-06, "loss": 1.1843, "step": 29391 }, { "epoch": 0.8, "learning_rate": 1.9734111433090886e-06, "loss": 1.2417, "step": 29392 }, { "epoch": 0.8, "learning_rate": 1.972883620690366e-06, "loss": 1.2017, "step": 29393 }, { "epoch": 0.8, "learning_rate": 1.972356160872023e-06, "loss": 1.2815, "step": 29394 }, { "epoch": 0.8, "learning_rate": 1.9718287638581945e-06, "loss": 1.2986, "step": 29395 }, { "epoch": 0.8, "learning_rate": 1.971301429653002e-06, "loss": 1.3052, "step": 29396 }, { "epoch": 0.8, "learning_rate": 1.9707741582605722e-06, "loss": 1.3633, "step": 29397 }, { "epoch": 0.8, "learning_rate": 1.970246949685026e-06, "loss": 1.3582, "step": 29398 }, { "epoch": 0.8, "learning_rate": 1.9697198039304965e-06, "loss": 1.2727, "step": 29399 }, { "epoch": 0.8, "learning_rate": 1.969192721001102e-06, "loss": 1.033, "step": 29400 }, { "epoch": 0.8, "learning_rate": 1.968665700900967e-06, "loss": 1.3276, "step": 29401 }, { "epoch": 0.8, "learning_rate": 1.9681387436342124e-06, "loss": 1.2593, "step": 29402 }, { "epoch": 0.8, "learning_rate": 1.967611849204967e-06, "loss": 1.1328, "step": 29403 }, { "epoch": 0.8, "learning_rate": 1.9670850176173485e-06, "loss": 1.3257, "step": 29404 }, { "epoch": 0.8, "learning_rate": 1.9665582488754777e-06, "loss": 1.1958, "step": 29405 }, { "epoch": 0.8, "learning_rate": 1.9660315429834787e-06, "loss": 1.3452, "step": 29406 }, { "epoch": 0.8, "learning_rate": 1.9655048999454693e-06, "loss": 1.2212, "step": 29407 }, { "epoch": 0.8, "learning_rate": 1.964978319765577e-06, "loss": 1.28, "step": 29408 }, { "epoch": 0.8, "learning_rate": 1.964451802447911e-06, "loss": 1.1152, "step": 29409 }, { "epoch": 0.8, "learning_rate": 1.963925347996597e-06, "loss": 1.175, "step": 29410 }, { "epoch": 0.8, "learning_rate": 1.9633989564157506e-06, "loss": 1.2256, "step": 29411 }, { "epoch": 0.8, "learning_rate": 1.9628726277094966e-06, "loss": 1.2988, "step": 29412 }, { "epoch": 0.8, "learning_rate": 1.9623463618819427e-06, "loss": 1.2371, "step": 29413 }, { "epoch": 0.8, "learning_rate": 1.9618201589372132e-06, "loss": 1.343, "step": 29414 }, { "epoch": 0.8, "learning_rate": 1.9612940188794217e-06, "loss": 1.2512, "step": 29415 }, { "epoch": 0.8, "learning_rate": 1.96076794171269e-06, "loss": 1.2319, "step": 29416 }, { "epoch": 0.8, "learning_rate": 1.960241927441124e-06, "loss": 1.2688, "step": 29417 }, { "epoch": 0.8, "learning_rate": 1.9597159760688477e-06, "loss": 1.2761, "step": 29418 }, { "epoch": 0.8, "learning_rate": 1.9591900875999703e-06, "loss": 1.104, "step": 29419 }, { "epoch": 0.8, "learning_rate": 1.9586642620386143e-06, "loss": 1.0356, "step": 29420 }, { "epoch": 0.8, "learning_rate": 1.958138499388882e-06, "loss": 1.229, "step": 29421 }, { "epoch": 0.8, "learning_rate": 1.957612799654892e-06, "loss": 1.1777, "step": 29422 }, { "epoch": 0.8, "learning_rate": 1.9570871628407616e-06, "loss": 1.2517, "step": 29423 }, { "epoch": 0.8, "learning_rate": 1.9565615889505984e-06, "loss": 1.1145, "step": 29424 }, { "epoch": 0.8, "learning_rate": 1.9560360779885157e-06, "loss": 1.4624, "step": 29425 }, { "epoch": 0.8, "learning_rate": 1.9555106299586203e-06, "loss": 1.2666, "step": 29426 }, { "epoch": 0.8, "learning_rate": 1.954985244865031e-06, "loss": 1.1729, "step": 29427 }, { "epoch": 0.8, "learning_rate": 1.9544599227118535e-06, "loss": 1.1926, "step": 29428 }, { "epoch": 0.8, "learning_rate": 1.9539346635031974e-06, "loss": 1.1675, "step": 29429 }, { "epoch": 0.8, "learning_rate": 1.9534094672431712e-06, "loss": 1.1265, "step": 29430 }, { "epoch": 0.8, "learning_rate": 1.952884333935888e-06, "loss": 1.3853, "step": 29431 }, { "epoch": 0.8, "learning_rate": 1.9523592635854538e-06, "loss": 1.2607, "step": 29432 }, { "epoch": 0.8, "learning_rate": 1.951834256195977e-06, "loss": 1.2314, "step": 29433 }, { "epoch": 0.8, "learning_rate": 1.951309311771561e-06, "loss": 1.1929, "step": 29434 }, { "epoch": 0.8, "learning_rate": 1.9507844303163195e-06, "loss": 1.2212, "step": 29435 }, { "epoch": 0.8, "learning_rate": 1.9502596118343553e-06, "loss": 1.2356, "step": 29436 }, { "epoch": 0.8, "learning_rate": 1.9497348563297715e-06, "loss": 1.324, "step": 29437 }, { "epoch": 0.8, "learning_rate": 1.9492101638066795e-06, "loss": 1.3096, "step": 29438 }, { "epoch": 0.8, "learning_rate": 1.9486855342691823e-06, "loss": 1.2175, "step": 29439 }, { "epoch": 0.8, "learning_rate": 1.948160967721383e-06, "loss": 1.2305, "step": 29440 }, { "epoch": 0.8, "learning_rate": 1.947636464167383e-06, "loss": 1.1365, "step": 29441 }, { "epoch": 0.8, "learning_rate": 1.947112023611292e-06, "loss": 1.3594, "step": 29442 }, { "epoch": 0.8, "learning_rate": 1.94658764605721e-06, "loss": 1.2129, "step": 29443 }, { "epoch": 0.8, "learning_rate": 1.9460633315092383e-06, "loss": 1.4031, "step": 29444 }, { "epoch": 0.8, "learning_rate": 1.945539079971478e-06, "loss": 1.2063, "step": 29445 }, { "epoch": 0.8, "learning_rate": 1.945014891448035e-06, "loss": 1.3345, "step": 29446 }, { "epoch": 0.8, "learning_rate": 1.944490765943007e-06, "loss": 1.5061, "step": 29447 }, { "epoch": 0.8, "learning_rate": 1.9439667034604958e-06, "loss": 1.3892, "step": 29448 }, { "epoch": 0.8, "learning_rate": 1.9434427040045988e-06, "loss": 1.4155, "step": 29449 }, { "epoch": 0.8, "learning_rate": 1.94291876757942e-06, "loss": 1.3054, "step": 29450 }, { "epoch": 0.8, "learning_rate": 1.9423948941890558e-06, "loss": 1.2179, "step": 29451 }, { "epoch": 0.8, "learning_rate": 1.941871083837602e-06, "loss": 1.2756, "step": 29452 }, { "epoch": 0.8, "learning_rate": 1.9413473365291636e-06, "loss": 1.3489, "step": 29453 }, { "epoch": 0.8, "learning_rate": 1.9408236522678305e-06, "loss": 1.2495, "step": 29454 }, { "epoch": 0.8, "learning_rate": 1.940300031057706e-06, "loss": 1.4067, "step": 29455 }, { "epoch": 0.8, "learning_rate": 1.9397764729028844e-06, "loss": 1.1018, "step": 29456 }, { "epoch": 0.8, "learning_rate": 1.939252977807462e-06, "loss": 1.3989, "step": 29457 }, { "epoch": 0.8, "learning_rate": 1.9387295457755308e-06, "loss": 1.1721, "step": 29458 }, { "epoch": 0.8, "learning_rate": 1.9382061768111915e-06, "loss": 1.335, "step": 29459 }, { "epoch": 0.8, "learning_rate": 1.9376828709185357e-06, "loss": 1.2087, "step": 29460 }, { "epoch": 0.8, "learning_rate": 1.937159628101658e-06, "loss": 1.0894, "step": 29461 }, { "epoch": 0.8, "learning_rate": 1.9366364483646505e-06, "loss": 1.2373, "step": 29462 }, { "epoch": 0.8, "learning_rate": 1.93611333171161e-06, "loss": 1.1426, "step": 29463 }, { "epoch": 0.8, "learning_rate": 1.9355902781466263e-06, "loss": 1.3286, "step": 29464 }, { "epoch": 0.8, "learning_rate": 1.9350672876737918e-06, "loss": 1.3372, "step": 29465 }, { "epoch": 0.8, "learning_rate": 1.934544360297197e-06, "loss": 1.2422, "step": 29466 }, { "epoch": 0.8, "learning_rate": 1.9340214960209358e-06, "loss": 1.259, "step": 29467 }, { "epoch": 0.8, "learning_rate": 1.9334986948490988e-06, "loss": 1.3696, "step": 29468 }, { "epoch": 0.8, "learning_rate": 1.932975956785771e-06, "loss": 1.3008, "step": 29469 }, { "epoch": 0.8, "learning_rate": 1.9324532818350495e-06, "loss": 1.3647, "step": 29470 }, { "epoch": 0.8, "learning_rate": 1.93193067000102e-06, "loss": 1.2695, "step": 29471 }, { "epoch": 0.8, "learning_rate": 1.93140812128777e-06, "loss": 1.2925, "step": 29472 }, { "epoch": 0.8, "learning_rate": 1.9308856356993867e-06, "loss": 1.1887, "step": 29473 }, { "epoch": 0.8, "learning_rate": 1.930363213239963e-06, "loss": 1.2471, "step": 29474 }, { "epoch": 0.8, "learning_rate": 1.9298408539135826e-06, "loss": 1.1694, "step": 29475 }, { "epoch": 0.8, "learning_rate": 1.9293185577243324e-06, "loss": 1.2522, "step": 29476 }, { "epoch": 0.8, "learning_rate": 1.928796324676295e-06, "loss": 1.1335, "step": 29477 }, { "epoch": 0.81, "learning_rate": 1.928274154773564e-06, "loss": 1.3682, "step": 29478 }, { "epoch": 0.81, "learning_rate": 1.9277520480202205e-06, "loss": 1.314, "step": 29479 }, { "epoch": 0.81, "learning_rate": 1.9272300044203485e-06, "loss": 1.2908, "step": 29480 }, { "epoch": 0.81, "learning_rate": 1.92670802397803e-06, "loss": 1.2991, "step": 29481 }, { "epoch": 0.81, "learning_rate": 1.9261861066973543e-06, "loss": 1.239, "step": 29482 }, { "epoch": 0.81, "learning_rate": 1.925664252582402e-06, "loss": 1.3647, "step": 29483 }, { "epoch": 0.81, "learning_rate": 1.925142461637254e-06, "loss": 1.1436, "step": 29484 }, { "epoch": 0.81, "learning_rate": 1.924620733865995e-06, "loss": 1.3352, "step": 29485 }, { "epoch": 0.81, "learning_rate": 1.924099069272708e-06, "loss": 1.22, "step": 29486 }, { "epoch": 0.81, "learning_rate": 1.9235774678614717e-06, "loss": 1.179, "step": 29487 }, { "epoch": 0.81, "learning_rate": 1.923055929636364e-06, "loss": 1.3179, "step": 29488 }, { "epoch": 0.81, "learning_rate": 1.9225344546014722e-06, "loss": 1.2556, "step": 29489 }, { "epoch": 0.81, "learning_rate": 1.9220130427608694e-06, "loss": 1.3523, "step": 29490 }, { "epoch": 0.81, "learning_rate": 1.9214916941186446e-06, "loss": 1.4578, "step": 29491 }, { "epoch": 0.81, "learning_rate": 1.9209704086788627e-06, "loss": 1.3938, "step": 29492 }, { "epoch": 0.81, "learning_rate": 1.9204491864456132e-06, "loss": 1.2456, "step": 29493 }, { "epoch": 0.81, "learning_rate": 1.919928027422967e-06, "loss": 1.1382, "step": 29494 }, { "epoch": 0.81, "learning_rate": 1.91940693161501e-06, "loss": 1.2405, "step": 29495 }, { "epoch": 0.81, "learning_rate": 1.9188858990258084e-06, "loss": 1.3464, "step": 29496 }, { "epoch": 0.81, "learning_rate": 1.9183649296594455e-06, "loss": 1.3611, "step": 29497 }, { "epoch": 0.81, "learning_rate": 1.9178440235199925e-06, "loss": 1.3342, "step": 29498 }, { "epoch": 0.81, "learning_rate": 1.91732318061153e-06, "loss": 1.2214, "step": 29499 }, { "epoch": 0.81, "learning_rate": 1.9168024009381303e-06, "loss": 1.2749, "step": 29500 }, { "epoch": 0.81, "learning_rate": 1.916281684503866e-06, "loss": 1.2837, "step": 29501 }, { "epoch": 0.81, "learning_rate": 1.915761031312814e-06, "loss": 1.2605, "step": 29502 }, { "epoch": 0.81, "learning_rate": 1.9152404413690463e-06, "loss": 1.2659, "step": 29503 }, { "epoch": 0.81, "learning_rate": 1.914719914676636e-06, "loss": 1.2205, "step": 29504 }, { "epoch": 0.81, "learning_rate": 1.9141994512396524e-06, "loss": 1.6885, "step": 29505 }, { "epoch": 0.81, "learning_rate": 1.913679051062173e-06, "loss": 0.9857, "step": 29506 }, { "epoch": 0.81, "learning_rate": 1.9131587141482656e-06, "loss": 1.3108, "step": 29507 }, { "epoch": 0.81, "learning_rate": 1.9126384405020015e-06, "loss": 1.1846, "step": 29508 }, { "epoch": 0.81, "learning_rate": 1.91211823012745e-06, "loss": 1.4648, "step": 29509 }, { "epoch": 0.81, "learning_rate": 1.911598083028684e-06, "loss": 1.1569, "step": 29510 }, { "epoch": 0.81, "learning_rate": 1.9110779992097704e-06, "loss": 1.1953, "step": 29511 }, { "epoch": 0.81, "learning_rate": 1.910557978674781e-06, "loss": 1.3433, "step": 29512 }, { "epoch": 0.81, "learning_rate": 1.910038021427778e-06, "loss": 1.7778, "step": 29513 }, { "epoch": 0.81, "learning_rate": 1.9095181274728357e-06, "loss": 1.3271, "step": 29514 }, { "epoch": 0.81, "learning_rate": 1.90899829681402e-06, "loss": 1.186, "step": 29515 }, { "epoch": 0.81, "learning_rate": 1.9084785294553932e-06, "loss": 1.2678, "step": 29516 }, { "epoch": 0.81, "learning_rate": 1.9079588254010297e-06, "loss": 1.3311, "step": 29517 }, { "epoch": 0.81, "learning_rate": 1.90743918465499e-06, "loss": 1.2512, "step": 29518 }, { "epoch": 0.81, "learning_rate": 1.9069196072213413e-06, "loss": 1.1758, "step": 29519 }, { "epoch": 0.81, "learning_rate": 1.906400093104145e-06, "loss": 1.1775, "step": 29520 }, { "epoch": 0.81, "learning_rate": 1.9058806423074705e-06, "loss": 1.2507, "step": 29521 }, { "epoch": 0.81, "learning_rate": 1.9053612548353806e-06, "loss": 1.3267, "step": 29522 }, { "epoch": 0.81, "learning_rate": 1.9048419306919385e-06, "loss": 1.2959, "step": 29523 }, { "epoch": 0.81, "learning_rate": 1.9043226698812024e-06, "loss": 1.2356, "step": 29524 }, { "epoch": 0.81, "learning_rate": 1.903803472407243e-06, "loss": 1.1541, "step": 29525 }, { "epoch": 0.81, "learning_rate": 1.9032843382741172e-06, "loss": 1.2329, "step": 29526 }, { "epoch": 0.81, "learning_rate": 1.9027652674858877e-06, "loss": 1.1526, "step": 29527 }, { "epoch": 0.81, "learning_rate": 1.9022462600466119e-06, "loss": 1.1882, "step": 29528 }, { "epoch": 0.81, "learning_rate": 1.9017273159603543e-06, "loss": 1.2891, "step": 29529 }, { "epoch": 0.81, "learning_rate": 1.901208435231179e-06, "loss": 1.187, "step": 29530 }, { "epoch": 0.81, "learning_rate": 1.900689617863135e-06, "loss": 1.084, "step": 29531 }, { "epoch": 0.81, "learning_rate": 1.90017086386029e-06, "loss": 1.3145, "step": 29532 }, { "epoch": 0.81, "learning_rate": 1.899652173226697e-06, "loss": 1.2883, "step": 29533 }, { "epoch": 0.81, "learning_rate": 1.8991335459664205e-06, "loss": 1.2566, "step": 29534 }, { "epoch": 0.81, "learning_rate": 1.8986149820835099e-06, "loss": 1.3354, "step": 29535 }, { "epoch": 0.81, "learning_rate": 1.898096481582028e-06, "loss": 1.2017, "step": 29536 }, { "epoch": 0.81, "learning_rate": 1.8975780444660274e-06, "loss": 1.2253, "step": 29537 }, { "epoch": 0.81, "learning_rate": 1.8970596707395706e-06, "loss": 1.3362, "step": 29538 }, { "epoch": 0.81, "learning_rate": 1.896541360406704e-06, "loss": 1.1523, "step": 29539 }, { "epoch": 0.81, "learning_rate": 1.8960231134714901e-06, "loss": 1.2659, "step": 29540 }, { "epoch": 0.81, "learning_rate": 1.8955049299379768e-06, "loss": 1.2589, "step": 29541 }, { "epoch": 0.81, "learning_rate": 1.8949868098102287e-06, "loss": 1.304, "step": 29542 }, { "epoch": 0.81, "learning_rate": 1.8944687530922866e-06, "loss": 1.1553, "step": 29543 }, { "epoch": 0.81, "learning_rate": 1.8939507597882122e-06, "loss": 1.2717, "step": 29544 }, { "epoch": 0.81, "learning_rate": 1.893432829902052e-06, "loss": 1.4092, "step": 29545 }, { "epoch": 0.81, "learning_rate": 1.892914963437865e-06, "loss": 1.2002, "step": 29546 }, { "epoch": 0.81, "learning_rate": 1.8923971603996983e-06, "loss": 1.2908, "step": 29547 }, { "epoch": 0.81, "learning_rate": 1.8918794207916024e-06, "loss": 1.1667, "step": 29548 }, { "epoch": 0.81, "learning_rate": 1.8913617446176303e-06, "loss": 1.2749, "step": 29549 }, { "epoch": 0.81, "learning_rate": 1.8908441318818317e-06, "loss": 1.2725, "step": 29550 }, { "epoch": 0.81, "learning_rate": 1.8903265825882555e-06, "loss": 1.2761, "step": 29551 }, { "epoch": 0.81, "learning_rate": 1.8898090967409476e-06, "loss": 1.2124, "step": 29552 }, { "epoch": 0.81, "learning_rate": 1.8892916743439626e-06, "loss": 1.2722, "step": 29553 }, { "epoch": 0.81, "learning_rate": 1.888774315401346e-06, "loss": 1.6704, "step": 29554 }, { "epoch": 0.81, "learning_rate": 1.8882570199171447e-06, "loss": 1.313, "step": 29555 }, { "epoch": 0.81, "learning_rate": 1.887739787895403e-06, "loss": 1.1367, "step": 29556 }, { "epoch": 0.81, "learning_rate": 1.8872226193401732e-06, "loss": 1.2629, "step": 29557 }, { "epoch": 0.81, "learning_rate": 1.886705514255499e-06, "loss": 1.3181, "step": 29558 }, { "epoch": 0.81, "learning_rate": 1.8861884726454261e-06, "loss": 1.2083, "step": 29559 }, { "epoch": 0.81, "learning_rate": 1.8856714945139965e-06, "loss": 1.3186, "step": 29560 }, { "epoch": 0.81, "learning_rate": 1.8851545798652592e-06, "loss": 1.2817, "step": 29561 }, { "epoch": 0.81, "learning_rate": 1.884637728703258e-06, "loss": 1.1292, "step": 29562 }, { "epoch": 0.81, "learning_rate": 1.8841209410320315e-06, "loss": 1.2668, "step": 29563 }, { "epoch": 0.81, "learning_rate": 1.883604216855629e-06, "loss": 1.2861, "step": 29564 }, { "epoch": 0.81, "learning_rate": 1.8830875561780904e-06, "loss": 1.1689, "step": 29565 }, { "epoch": 0.81, "learning_rate": 1.882570959003459e-06, "loss": 1.2183, "step": 29566 }, { "epoch": 0.81, "learning_rate": 1.882054425335772e-06, "loss": 1.4309, "step": 29567 }, { "epoch": 0.81, "learning_rate": 1.8815379551790757e-06, "loss": 1.1614, "step": 29568 }, { "epoch": 0.81, "learning_rate": 1.8810215485374105e-06, "loss": 1.385, "step": 29569 }, { "epoch": 0.81, "learning_rate": 1.8805052054148132e-06, "loss": 1.2917, "step": 29570 }, { "epoch": 0.81, "learning_rate": 1.8799889258153236e-06, "loss": 1.3196, "step": 29571 }, { "epoch": 0.81, "learning_rate": 1.8794727097429844e-06, "loss": 1.3394, "step": 29572 }, { "epoch": 0.81, "learning_rate": 1.8789565572018331e-06, "loss": 1.325, "step": 29573 }, { "epoch": 0.81, "learning_rate": 1.8784404681959057e-06, "loss": 1.3723, "step": 29574 }, { "epoch": 0.81, "learning_rate": 1.8779244427292399e-06, "loss": 1.1455, "step": 29575 }, { "epoch": 0.81, "learning_rate": 1.8774084808058723e-06, "loss": 1.228, "step": 29576 }, { "epoch": 0.81, "learning_rate": 1.8768925824298478e-06, "loss": 1.2412, "step": 29577 }, { "epoch": 0.81, "learning_rate": 1.8763767476051898e-06, "loss": 1.2219, "step": 29578 }, { "epoch": 0.81, "learning_rate": 1.8758609763359437e-06, "loss": 1.2739, "step": 29579 }, { "epoch": 0.81, "learning_rate": 1.8753452686261375e-06, "loss": 1.1064, "step": 29580 }, { "epoch": 0.81, "learning_rate": 1.8748296244798149e-06, "loss": 1.155, "step": 29581 }, { "epoch": 0.81, "learning_rate": 1.874314043901e-06, "loss": 1.2954, "step": 29582 }, { "epoch": 0.81, "learning_rate": 1.8737985268937332e-06, "loss": 1.2122, "step": 29583 }, { "epoch": 0.81, "learning_rate": 1.8732830734620434e-06, "loss": 1.1365, "step": 29584 }, { "epoch": 0.81, "learning_rate": 1.8727676836099695e-06, "loss": 1.0078, "step": 29585 }, { "epoch": 0.81, "learning_rate": 1.8722523573415353e-06, "loss": 1.2664, "step": 29586 }, { "epoch": 0.81, "learning_rate": 1.8717370946607783e-06, "loss": 1.1379, "step": 29587 }, { "epoch": 0.81, "learning_rate": 1.8712218955717266e-06, "loss": 1.2273, "step": 29588 }, { "epoch": 0.81, "learning_rate": 1.8707067600784167e-06, "loss": 1.2312, "step": 29589 }, { "epoch": 0.81, "learning_rate": 1.8701916881848703e-06, "loss": 1.2634, "step": 29590 }, { "epoch": 0.81, "learning_rate": 1.8696766798951206e-06, "loss": 1.1562, "step": 29591 }, { "epoch": 0.81, "learning_rate": 1.8691617352131997e-06, "loss": 1.1628, "step": 29592 }, { "epoch": 0.81, "learning_rate": 1.8686468541431347e-06, "loss": 1.3276, "step": 29593 }, { "epoch": 0.81, "learning_rate": 1.8681320366889522e-06, "loss": 1.2148, "step": 29594 }, { "epoch": 0.81, "learning_rate": 1.867617282854679e-06, "loss": 1.2944, "step": 29595 }, { "epoch": 0.81, "learning_rate": 1.8671025926443464e-06, "loss": 1.2295, "step": 29596 }, { "epoch": 0.81, "learning_rate": 1.866587966061979e-06, "loss": 1.3186, "step": 29597 }, { "epoch": 0.81, "learning_rate": 1.8660734031116023e-06, "loss": 1.3057, "step": 29598 }, { "epoch": 0.81, "learning_rate": 1.86555890379724e-06, "loss": 1.2449, "step": 29599 }, { "epoch": 0.81, "learning_rate": 1.865044468122922e-06, "loss": 1.2732, "step": 29600 }, { "epoch": 0.81, "learning_rate": 1.8645300960926716e-06, "loss": 1.2583, "step": 29601 }, { "epoch": 0.81, "learning_rate": 1.8640157877105114e-06, "loss": 1.4624, "step": 29602 }, { "epoch": 0.81, "learning_rate": 1.8635015429804636e-06, "loss": 1.2336, "step": 29603 }, { "epoch": 0.81, "learning_rate": 1.8629873619065565e-06, "loss": 1.1001, "step": 29604 }, { "epoch": 0.81, "learning_rate": 1.8624732444928096e-06, "loss": 1.2351, "step": 29605 }, { "epoch": 0.81, "learning_rate": 1.8619591907432455e-06, "loss": 1.1626, "step": 29606 }, { "epoch": 0.81, "learning_rate": 1.8614452006618833e-06, "loss": 1.2095, "step": 29607 }, { "epoch": 0.81, "learning_rate": 1.8609312742527498e-06, "loss": 1.2628, "step": 29608 }, { "epoch": 0.81, "learning_rate": 1.8604174115198626e-06, "loss": 1.2478, "step": 29609 }, { "epoch": 0.81, "learning_rate": 1.8599036124672398e-06, "loss": 1.3364, "step": 29610 }, { "epoch": 0.81, "learning_rate": 1.859389877098905e-06, "loss": 1.3086, "step": 29611 }, { "epoch": 0.81, "learning_rate": 1.858876205418877e-06, "loss": 1.3125, "step": 29612 }, { "epoch": 0.81, "learning_rate": 1.8583625974311726e-06, "loss": 1.2239, "step": 29613 }, { "epoch": 0.81, "learning_rate": 1.8578490531398085e-06, "loss": 1.2593, "step": 29614 }, { "epoch": 0.81, "learning_rate": 1.8573355725488063e-06, "loss": 1.114, "step": 29615 }, { "epoch": 0.81, "learning_rate": 1.8568221556621824e-06, "loss": 1.3916, "step": 29616 }, { "epoch": 0.81, "learning_rate": 1.8563088024839538e-06, "loss": 1.1248, "step": 29617 }, { "epoch": 0.81, "learning_rate": 1.8557955130181316e-06, "loss": 1.3208, "step": 29618 }, { "epoch": 0.81, "learning_rate": 1.8552822872687393e-06, "loss": 1.0061, "step": 29619 }, { "epoch": 0.81, "learning_rate": 1.8547691252397871e-06, "loss": 1.7642, "step": 29620 }, { "epoch": 0.81, "learning_rate": 1.8542560269352926e-06, "loss": 1.2371, "step": 29621 }, { "epoch": 0.81, "learning_rate": 1.8537429923592655e-06, "loss": 1.2041, "step": 29622 }, { "epoch": 0.81, "learning_rate": 1.8532300215157218e-06, "loss": 1.2788, "step": 29623 }, { "epoch": 0.81, "learning_rate": 1.8527171144086808e-06, "loss": 1.3352, "step": 29624 }, { "epoch": 0.81, "learning_rate": 1.8522042710421462e-06, "loss": 1.4028, "step": 29625 }, { "epoch": 0.81, "learning_rate": 1.8516914914201357e-06, "loss": 1.2625, "step": 29626 }, { "epoch": 0.81, "learning_rate": 1.851178775546656e-06, "loss": 1.23, "step": 29627 }, { "epoch": 0.81, "learning_rate": 1.8506661234257285e-06, "loss": 1.3225, "step": 29628 }, { "epoch": 0.81, "learning_rate": 1.8501535350613508e-06, "loss": 1.2544, "step": 29629 }, { "epoch": 0.81, "learning_rate": 1.8496410104575424e-06, "loss": 1.6392, "step": 29630 }, { "epoch": 0.81, "learning_rate": 1.8491285496183075e-06, "loss": 1.2979, "step": 29631 }, { "epoch": 0.81, "learning_rate": 1.848616152547663e-06, "loss": 1.3179, "step": 29632 }, { "epoch": 0.81, "learning_rate": 1.848103819249608e-06, "loss": 1.2437, "step": 29633 }, { "epoch": 0.81, "learning_rate": 1.8475915497281583e-06, "loss": 1.3325, "step": 29634 }, { "epoch": 0.81, "learning_rate": 1.8470793439873158e-06, "loss": 1.3386, "step": 29635 }, { "epoch": 0.81, "learning_rate": 1.8465672020310955e-06, "loss": 1.3328, "step": 29636 }, { "epoch": 0.81, "learning_rate": 1.846055123863494e-06, "loss": 1.3765, "step": 29637 }, { "epoch": 0.81, "learning_rate": 1.8455431094885234e-06, "loss": 1.1104, "step": 29638 }, { "epoch": 0.81, "learning_rate": 1.845031158910192e-06, "loss": 1.3206, "step": 29639 }, { "epoch": 0.81, "learning_rate": 1.8445192721325023e-06, "loss": 1.2991, "step": 29640 }, { "epoch": 0.81, "learning_rate": 1.8440074491594585e-06, "loss": 1.3772, "step": 29641 }, { "epoch": 0.81, "learning_rate": 1.8434956899950618e-06, "loss": 1.137, "step": 29642 }, { "epoch": 0.81, "learning_rate": 1.8429839946433225e-06, "loss": 1.2776, "step": 29643 }, { "epoch": 0.81, "learning_rate": 1.8424723631082408e-06, "loss": 1.3628, "step": 29644 }, { "epoch": 0.81, "learning_rate": 1.84196079539382e-06, "loss": 1.2805, "step": 29645 }, { "epoch": 0.81, "learning_rate": 1.8414492915040583e-06, "loss": 1.2444, "step": 29646 }, { "epoch": 0.81, "learning_rate": 1.8409378514429644e-06, "loss": 1.6875, "step": 29647 }, { "epoch": 0.81, "learning_rate": 1.840426475214535e-06, "loss": 1.2188, "step": 29648 }, { "epoch": 0.81, "learning_rate": 1.839915162822772e-06, "loss": 1.084, "step": 29649 }, { "epoch": 0.81, "learning_rate": 1.8394039142716735e-06, "loss": 1.1694, "step": 29650 }, { "epoch": 0.81, "learning_rate": 1.8388927295652449e-06, "loss": 1.0859, "step": 29651 }, { "epoch": 0.81, "learning_rate": 1.83838160870748e-06, "loss": 1.2327, "step": 29652 }, { "epoch": 0.81, "learning_rate": 1.8378705517023788e-06, "loss": 1.3059, "step": 29653 }, { "epoch": 0.81, "learning_rate": 1.8373595585539416e-06, "loss": 1.3176, "step": 29654 }, { "epoch": 0.81, "learning_rate": 1.8368486292661657e-06, "loss": 1.214, "step": 29655 }, { "epoch": 0.81, "learning_rate": 1.8363377638430468e-06, "loss": 1.2566, "step": 29656 }, { "epoch": 0.81, "learning_rate": 1.8358269622885806e-06, "loss": 1.3433, "step": 29657 }, { "epoch": 0.81, "learning_rate": 1.8353162246067668e-06, "loss": 1.2664, "step": 29658 }, { "epoch": 0.81, "learning_rate": 1.8348055508016004e-06, "loss": 1.2617, "step": 29659 }, { "epoch": 0.81, "learning_rate": 1.834294940877075e-06, "loss": 1.3003, "step": 29660 }, { "epoch": 0.81, "learning_rate": 1.8337843948371848e-06, "loss": 1.4434, "step": 29661 }, { "epoch": 0.81, "learning_rate": 1.8332739126859268e-06, "loss": 1.2764, "step": 29662 }, { "epoch": 0.81, "learning_rate": 1.8327634944272942e-06, "loss": 1.2417, "step": 29663 }, { "epoch": 0.81, "learning_rate": 1.8322531400652798e-06, "loss": 1.1604, "step": 29664 }, { "epoch": 0.81, "learning_rate": 1.8317428496038725e-06, "loss": 1.4099, "step": 29665 }, { "epoch": 0.81, "learning_rate": 1.8312326230470711e-06, "loss": 1.304, "step": 29666 }, { "epoch": 0.81, "learning_rate": 1.830722460398865e-06, "loss": 1.1377, "step": 29667 }, { "epoch": 0.81, "learning_rate": 1.830212361663245e-06, "loss": 1.344, "step": 29668 }, { "epoch": 0.81, "learning_rate": 1.8297023268441981e-06, "loss": 1.3459, "step": 29669 }, { "epoch": 0.81, "learning_rate": 1.8291923559457192e-06, "loss": 1.2717, "step": 29670 }, { "epoch": 0.81, "learning_rate": 1.8286824489718024e-06, "loss": 1.3212, "step": 29671 }, { "epoch": 0.81, "learning_rate": 1.828172605926426e-06, "loss": 1.3083, "step": 29672 }, { "epoch": 0.81, "learning_rate": 1.8276628268135865e-06, "loss": 1.2986, "step": 29673 }, { "epoch": 0.81, "learning_rate": 1.8271531116372687e-06, "loss": 1.324, "step": 29674 }, { "epoch": 0.81, "learning_rate": 1.826643460401466e-06, "loss": 1.2407, "step": 29675 }, { "epoch": 0.81, "learning_rate": 1.8261338731101574e-06, "loss": 1.3682, "step": 29676 }, { "epoch": 0.81, "learning_rate": 1.8256243497673355e-06, "loss": 1.1863, "step": 29677 }, { "epoch": 0.81, "learning_rate": 1.825114890376982e-06, "loss": 1.2312, "step": 29678 }, { "epoch": 0.81, "learning_rate": 1.8246054949430915e-06, "loss": 1.2637, "step": 29679 }, { "epoch": 0.81, "learning_rate": 1.8240961634696387e-06, "loss": 1.3152, "step": 29680 }, { "epoch": 0.81, "learning_rate": 1.823586895960614e-06, "loss": 1.2395, "step": 29681 }, { "epoch": 0.81, "learning_rate": 1.8230776924199989e-06, "loss": 1.3835, "step": 29682 }, { "epoch": 0.81, "learning_rate": 1.8225685528517833e-06, "loss": 1.23, "step": 29683 }, { "epoch": 0.81, "learning_rate": 1.822059477259942e-06, "loss": 1.4163, "step": 29684 }, { "epoch": 0.81, "learning_rate": 1.8215504656484605e-06, "loss": 1.2112, "step": 29685 }, { "epoch": 0.81, "learning_rate": 1.8210415180213258e-06, "loss": 1.416, "step": 29686 }, { "epoch": 0.81, "learning_rate": 1.8205326343825158e-06, "loss": 1.2539, "step": 29687 }, { "epoch": 0.81, "learning_rate": 1.8200238147360127e-06, "loss": 1.2297, "step": 29688 }, { "epoch": 0.81, "learning_rate": 1.8195150590857934e-06, "loss": 1.2131, "step": 29689 }, { "epoch": 0.81, "learning_rate": 1.8190063674358448e-06, "loss": 1.3625, "step": 29690 }, { "epoch": 0.81, "learning_rate": 1.8184977397901437e-06, "loss": 1.1548, "step": 29691 }, { "epoch": 0.81, "learning_rate": 1.8179891761526691e-06, "loss": 1.2776, "step": 29692 }, { "epoch": 0.81, "learning_rate": 1.8174806765273968e-06, "loss": 1.2856, "step": 29693 }, { "epoch": 0.81, "learning_rate": 1.81697224091831e-06, "loss": 1.3008, "step": 29694 }, { "epoch": 0.81, "learning_rate": 1.8164638693293847e-06, "loss": 1.2075, "step": 29695 }, { "epoch": 0.81, "learning_rate": 1.8159555617645985e-06, "loss": 1.6929, "step": 29696 }, { "epoch": 0.81, "learning_rate": 1.8154473182279242e-06, "loss": 1.1509, "step": 29697 }, { "epoch": 0.81, "learning_rate": 1.814939138723345e-06, "loss": 1.1477, "step": 29698 }, { "epoch": 0.81, "learning_rate": 1.8144310232548323e-06, "loss": 1.1267, "step": 29699 }, { "epoch": 0.81, "learning_rate": 1.8139229718263595e-06, "loss": 1.2002, "step": 29700 }, { "epoch": 0.81, "learning_rate": 1.8134149844419068e-06, "loss": 1.2693, "step": 29701 }, { "epoch": 0.81, "learning_rate": 1.8129070611054466e-06, "loss": 1.2341, "step": 29702 }, { "epoch": 0.81, "learning_rate": 1.8123992018209502e-06, "loss": 1.3884, "step": 29703 }, { "epoch": 0.81, "learning_rate": 1.8118914065923908e-06, "loss": 1.3567, "step": 29704 }, { "epoch": 0.81, "learning_rate": 1.8113836754237446e-06, "loss": 1.3115, "step": 29705 }, { "epoch": 0.81, "learning_rate": 1.8108760083189825e-06, "loss": 1.1497, "step": 29706 }, { "epoch": 0.81, "learning_rate": 1.8103684052820759e-06, "loss": 1.3682, "step": 29707 }, { "epoch": 0.81, "learning_rate": 1.8098608663169925e-06, "loss": 1.303, "step": 29708 }, { "epoch": 0.81, "learning_rate": 1.8093533914277095e-06, "loss": 1.1624, "step": 29709 }, { "epoch": 0.81, "learning_rate": 1.8088459806181946e-06, "loss": 1.7676, "step": 29710 }, { "epoch": 0.81, "learning_rate": 1.8083386338924159e-06, "loss": 1.2607, "step": 29711 }, { "epoch": 0.81, "learning_rate": 1.8078313512543422e-06, "loss": 1.2402, "step": 29712 }, { "epoch": 0.81, "learning_rate": 1.807324132707945e-06, "loss": 1.2152, "step": 29713 }, { "epoch": 0.81, "learning_rate": 1.806816978257192e-06, "loss": 1.2314, "step": 29714 }, { "epoch": 0.81, "learning_rate": 1.8063098879060503e-06, "loss": 1.3267, "step": 29715 }, { "epoch": 0.81, "learning_rate": 1.8058028616584856e-06, "loss": 1.3276, "step": 29716 }, { "epoch": 0.81, "learning_rate": 1.8052958995184644e-06, "loss": 1.2957, "step": 29717 }, { "epoch": 0.81, "learning_rate": 1.8047890014899606e-06, "loss": 1.1365, "step": 29718 }, { "epoch": 0.81, "learning_rate": 1.8042821675769284e-06, "loss": 1.1516, "step": 29719 }, { "epoch": 0.81, "learning_rate": 1.8037753977833416e-06, "loss": 1.3765, "step": 29720 }, { "epoch": 0.81, "learning_rate": 1.8032686921131593e-06, "loss": 1.1829, "step": 29721 }, { "epoch": 0.81, "learning_rate": 1.8027620505703514e-06, "loss": 1.1653, "step": 29722 }, { "epoch": 0.81, "learning_rate": 1.8022554731588782e-06, "loss": 1.1482, "step": 29723 }, { "epoch": 0.81, "learning_rate": 1.801748959882703e-06, "loss": 1.1646, "step": 29724 }, { "epoch": 0.81, "learning_rate": 1.8012425107457865e-06, "loss": 1.241, "step": 29725 }, { "epoch": 0.81, "learning_rate": 1.800736125752096e-06, "loss": 1.3105, "step": 29726 }, { "epoch": 0.81, "learning_rate": 1.8002298049055911e-06, "loss": 1.3364, "step": 29727 }, { "epoch": 0.81, "learning_rate": 1.7997235482102314e-06, "loss": 1.2468, "step": 29728 }, { "epoch": 0.81, "learning_rate": 1.7992173556699766e-06, "loss": 1.1519, "step": 29729 }, { "epoch": 0.81, "learning_rate": 1.7987112272887908e-06, "loss": 1.3035, "step": 29730 }, { "epoch": 0.81, "learning_rate": 1.7982051630706322e-06, "loss": 1.3831, "step": 29731 }, { "epoch": 0.81, "learning_rate": 1.7976991630194574e-06, "loss": 1.1919, "step": 29732 }, { "epoch": 0.81, "learning_rate": 1.79719322713923e-06, "loss": 1.2612, "step": 29733 }, { "epoch": 0.81, "learning_rate": 1.7966873554339048e-06, "loss": 1.257, "step": 29734 }, { "epoch": 0.81, "learning_rate": 1.7961815479074407e-06, "loss": 1.3137, "step": 29735 }, { "epoch": 0.81, "learning_rate": 1.7956758045637922e-06, "loss": 1.2295, "step": 29736 }, { "epoch": 0.81, "learning_rate": 1.795170125406921e-06, "loss": 1.3049, "step": 29737 }, { "epoch": 0.81, "learning_rate": 1.79466451044078e-06, "loss": 1.2632, "step": 29738 }, { "epoch": 0.81, "learning_rate": 1.7941589596693254e-06, "loss": 1.4312, "step": 29739 }, { "epoch": 0.81, "learning_rate": 1.7936534730965105e-06, "loss": 1.314, "step": 29740 }, { "epoch": 0.81, "learning_rate": 1.7931480507262933e-06, "loss": 1.3499, "step": 29741 }, { "epoch": 0.81, "learning_rate": 1.7926426925626273e-06, "loss": 1.3743, "step": 29742 }, { "epoch": 0.81, "learning_rate": 1.792137398609466e-06, "loss": 1.3469, "step": 29743 }, { "epoch": 0.81, "learning_rate": 1.7916321688707593e-06, "loss": 1.158, "step": 29744 }, { "epoch": 0.81, "learning_rate": 1.7911270033504647e-06, "loss": 1.2822, "step": 29745 }, { "epoch": 0.81, "learning_rate": 1.7906219020525329e-06, "loss": 1.291, "step": 29746 }, { "epoch": 0.81, "learning_rate": 1.790116864980912e-06, "loss": 1.3145, "step": 29747 }, { "epoch": 0.81, "learning_rate": 1.789611892139559e-06, "loss": 1.3108, "step": 29748 }, { "epoch": 0.81, "learning_rate": 1.7891069835324216e-06, "loss": 1.3528, "step": 29749 }, { "epoch": 0.81, "learning_rate": 1.78860213916345e-06, "loss": 1.2944, "step": 29750 }, { "epoch": 0.81, "learning_rate": 1.7880973590365924e-06, "loss": 1.0281, "step": 29751 }, { "epoch": 0.81, "learning_rate": 1.787592643155801e-06, "loss": 1.1643, "step": 29752 }, { "epoch": 0.81, "learning_rate": 1.7870879915250206e-06, "loss": 1.3704, "step": 29753 }, { "epoch": 0.81, "learning_rate": 1.7865834041482078e-06, "loss": 1.1299, "step": 29754 }, { "epoch": 0.81, "learning_rate": 1.7860788810292983e-06, "loss": 1.3188, "step": 29755 }, { "epoch": 0.81, "learning_rate": 1.7855744221722482e-06, "loss": 1.2068, "step": 29756 }, { "epoch": 0.81, "learning_rate": 1.7850700275809973e-06, "loss": 1.291, "step": 29757 }, { "epoch": 0.81, "learning_rate": 1.7845656972595015e-06, "loss": 1.3384, "step": 29758 }, { "epoch": 0.81, "learning_rate": 1.7840614312116966e-06, "loss": 1.4685, "step": 29759 }, { "epoch": 0.81, "learning_rate": 1.7835572294415326e-06, "loss": 1.1196, "step": 29760 }, { "epoch": 0.81, "learning_rate": 1.783053091952951e-06, "loss": 1.2793, "step": 29761 }, { "epoch": 0.81, "learning_rate": 1.7825490187499005e-06, "loss": 1.2068, "step": 29762 }, { "epoch": 0.81, "learning_rate": 1.7820450098363228e-06, "loss": 1.1562, "step": 29763 }, { "epoch": 0.81, "learning_rate": 1.7815410652161592e-06, "loss": 1.3364, "step": 29764 }, { "epoch": 0.81, "learning_rate": 1.781037184893354e-06, "loss": 1.1882, "step": 29765 }, { "epoch": 0.81, "learning_rate": 1.7805333688718507e-06, "loss": 1.0945, "step": 29766 }, { "epoch": 0.81, "learning_rate": 1.7800296171555886e-06, "loss": 1.373, "step": 29767 }, { "epoch": 0.81, "learning_rate": 1.7795259297485067e-06, "loss": 1.2732, "step": 29768 }, { "epoch": 0.81, "learning_rate": 1.779022306654551e-06, "loss": 1.3103, "step": 29769 }, { "epoch": 0.81, "learning_rate": 1.7785187478776599e-06, "loss": 1.2805, "step": 29770 }, { "epoch": 0.81, "learning_rate": 1.7780152534217709e-06, "loss": 1.3235, "step": 29771 }, { "epoch": 0.81, "learning_rate": 1.7775118232908228e-06, "loss": 1.3093, "step": 29772 }, { "epoch": 0.81, "learning_rate": 1.777008457488757e-06, "loss": 1.6821, "step": 29773 }, { "epoch": 0.81, "learning_rate": 1.7765051560195113e-06, "loss": 1.1733, "step": 29774 }, { "epoch": 0.81, "learning_rate": 1.7760019188870214e-06, "loss": 1.1733, "step": 29775 }, { "epoch": 0.81, "learning_rate": 1.7754987460952244e-06, "loss": 1.2942, "step": 29776 }, { "epoch": 0.81, "learning_rate": 1.7749956376480593e-06, "loss": 1.1919, "step": 29777 }, { "epoch": 0.81, "learning_rate": 1.7744925935494606e-06, "loss": 1.2732, "step": 29778 }, { "epoch": 0.81, "learning_rate": 1.7739896138033608e-06, "loss": 1.1978, "step": 29779 }, { "epoch": 0.81, "learning_rate": 1.7734866984137011e-06, "loss": 1.354, "step": 29780 }, { "epoch": 0.81, "learning_rate": 1.772983847384414e-06, "loss": 1.29, "step": 29781 }, { "epoch": 0.81, "learning_rate": 1.772481060719432e-06, "loss": 1.3354, "step": 29782 }, { "epoch": 0.81, "learning_rate": 1.7719783384226863e-06, "loss": 1.4285, "step": 29783 }, { "epoch": 0.81, "learning_rate": 1.771475680498116e-06, "loss": 1.1633, "step": 29784 }, { "epoch": 0.81, "learning_rate": 1.770973086949651e-06, "loss": 1.3413, "step": 29785 }, { "epoch": 0.81, "learning_rate": 1.770470557781222e-06, "loss": 1.2668, "step": 29786 }, { "epoch": 0.81, "learning_rate": 1.76996809299676e-06, "loss": 1.2273, "step": 29787 }, { "epoch": 0.81, "learning_rate": 1.7694656926001997e-06, "loss": 1.2073, "step": 29788 }, { "epoch": 0.81, "learning_rate": 1.76896335659547e-06, "loss": 1.2734, "step": 29789 }, { "epoch": 0.81, "learning_rate": 1.7684610849865003e-06, "loss": 1.4277, "step": 29790 }, { "epoch": 0.81, "learning_rate": 1.7679588777772172e-06, "loss": 1.2861, "step": 29791 }, { "epoch": 0.81, "learning_rate": 1.7674567349715565e-06, "loss": 1.1702, "step": 29792 }, { "epoch": 0.81, "learning_rate": 1.766954656573442e-06, "loss": 1.3032, "step": 29793 }, { "epoch": 0.81, "learning_rate": 1.7664526425868012e-06, "loss": 1.177, "step": 29794 }, { "epoch": 0.81, "learning_rate": 1.7659506930155645e-06, "loss": 1.4033, "step": 29795 }, { "epoch": 0.81, "learning_rate": 1.7654488078636566e-06, "loss": 1.2869, "step": 29796 }, { "epoch": 0.81, "learning_rate": 1.764946987135009e-06, "loss": 1.2224, "step": 29797 }, { "epoch": 0.81, "learning_rate": 1.764445230833539e-06, "loss": 1.3469, "step": 29798 }, { "epoch": 0.81, "learning_rate": 1.7639435389631797e-06, "loss": 1.3284, "step": 29799 }, { "epoch": 0.81, "learning_rate": 1.7634419115278513e-06, "loss": 1.4009, "step": 29800 }, { "epoch": 0.81, "learning_rate": 1.7629403485314845e-06, "loss": 1.3796, "step": 29801 }, { "epoch": 0.81, "learning_rate": 1.7624388499779943e-06, "loss": 1.0964, "step": 29802 }, { "epoch": 0.81, "learning_rate": 1.761937415871311e-06, "loss": 1.2354, "step": 29803 }, { "epoch": 0.81, "learning_rate": 1.7614360462153536e-06, "loss": 1.2612, "step": 29804 }, { "epoch": 0.81, "learning_rate": 1.7609347410140509e-06, "loss": 1.3096, "step": 29805 }, { "epoch": 0.81, "learning_rate": 1.7604335002713158e-06, "loss": 1.1082, "step": 29806 }, { "epoch": 0.81, "learning_rate": 1.7599323239910782e-06, "loss": 1.3069, "step": 29807 }, { "epoch": 0.81, "learning_rate": 1.7594312121772516e-06, "loss": 1.3162, "step": 29808 }, { "epoch": 0.81, "learning_rate": 1.758930164833762e-06, "loss": 1.4009, "step": 29809 }, { "epoch": 0.81, "learning_rate": 1.7584291819645294e-06, "loss": 1.2981, "step": 29810 }, { "epoch": 0.81, "learning_rate": 1.7579282635734674e-06, "loss": 1.2371, "step": 29811 }, { "epoch": 0.81, "learning_rate": 1.7574274096645017e-06, "loss": 1.2761, "step": 29812 }, { "epoch": 0.81, "learning_rate": 1.756926620241549e-06, "loss": 1.3069, "step": 29813 }, { "epoch": 0.81, "learning_rate": 1.7564258953085257e-06, "loss": 1.3628, "step": 29814 }, { "epoch": 0.81, "learning_rate": 1.7559252348693468e-06, "loss": 1.3525, "step": 29815 }, { "epoch": 0.81, "learning_rate": 1.755424638927935e-06, "loss": 1.0547, "step": 29816 }, { "epoch": 0.81, "learning_rate": 1.754924107488204e-06, "loss": 1.0374, "step": 29817 }, { "epoch": 0.81, "learning_rate": 1.7544236405540704e-06, "loss": 1.0903, "step": 29818 }, { "epoch": 0.81, "learning_rate": 1.7539232381294458e-06, "loss": 1.2517, "step": 29819 }, { "epoch": 0.81, "learning_rate": 1.7534229002182502e-06, "loss": 1.7109, "step": 29820 }, { "epoch": 0.81, "learning_rate": 1.7529226268243972e-06, "loss": 1.29, "step": 29821 }, { "epoch": 0.81, "learning_rate": 1.7524224179517978e-06, "loss": 1.458, "step": 29822 }, { "epoch": 0.81, "learning_rate": 1.7519222736043662e-06, "loss": 1.2373, "step": 29823 }, { "epoch": 0.81, "learning_rate": 1.7514221937860188e-06, "loss": 1.106, "step": 29824 }, { "epoch": 0.81, "learning_rate": 1.7509221785006647e-06, "loss": 1.1843, "step": 29825 }, { "epoch": 0.81, "learning_rate": 1.7504222277522132e-06, "loss": 1.2717, "step": 29826 }, { "epoch": 0.81, "learning_rate": 1.749922341544582e-06, "loss": 1.2571, "step": 29827 }, { "epoch": 0.81, "learning_rate": 1.7494225198816795e-06, "loss": 1.3198, "step": 29828 }, { "epoch": 0.81, "learning_rate": 1.7489227627674155e-06, "loss": 1.2124, "step": 29829 }, { "epoch": 0.81, "learning_rate": 1.748423070205697e-06, "loss": 1.3535, "step": 29830 }, { "epoch": 0.81, "learning_rate": 1.7479234422004388e-06, "loss": 1.3311, "step": 29831 }, { "epoch": 0.81, "learning_rate": 1.7474238787555475e-06, "loss": 1.2859, "step": 29832 }, { "epoch": 0.81, "learning_rate": 1.7469243798749314e-06, "loss": 1.1255, "step": 29833 }, { "epoch": 0.81, "learning_rate": 1.7464249455624948e-06, "loss": 1.3562, "step": 29834 }, { "epoch": 0.81, "learning_rate": 1.7459255758221505e-06, "loss": 1.429, "step": 29835 }, { "epoch": 0.81, "learning_rate": 1.745426270657804e-06, "loss": 1.2378, "step": 29836 }, { "epoch": 0.81, "learning_rate": 1.7449270300733611e-06, "loss": 1.2986, "step": 29837 }, { "epoch": 0.81, "learning_rate": 1.7444278540727233e-06, "loss": 1.1821, "step": 29838 }, { "epoch": 0.81, "learning_rate": 1.743928742659804e-06, "loss": 1.259, "step": 29839 }, { "epoch": 0.81, "learning_rate": 1.7434296958385033e-06, "loss": 1.2527, "step": 29840 }, { "epoch": 0.81, "learning_rate": 1.7429307136127237e-06, "loss": 1.1846, "step": 29841 }, { "epoch": 0.81, "learning_rate": 1.7424317959863735e-06, "loss": 1.2371, "step": 29842 }, { "epoch": 0.81, "learning_rate": 1.7419329429633524e-06, "loss": 1.3635, "step": 29843 }, { "epoch": 0.82, "learning_rate": 1.7414341545475689e-06, "loss": 1.7061, "step": 29844 }, { "epoch": 0.82, "learning_rate": 1.740935430742916e-06, "loss": 1.2307, "step": 29845 }, { "epoch": 0.82, "learning_rate": 1.7404367715533043e-06, "loss": 1.3438, "step": 29846 }, { "epoch": 0.82, "learning_rate": 1.7399381769826273e-06, "loss": 1.1562, "step": 29847 }, { "epoch": 0.82, "learning_rate": 1.7394396470347963e-06, "loss": 1.1475, "step": 29848 }, { "epoch": 0.82, "learning_rate": 1.7389411817136991e-06, "loss": 1.7812, "step": 29849 }, { "epoch": 0.82, "learning_rate": 1.738442781023244e-06, "loss": 1.2898, "step": 29850 }, { "epoch": 0.82, "learning_rate": 1.7379444449673256e-06, "loss": 1.2786, "step": 29851 }, { "epoch": 0.82, "learning_rate": 1.7374461735498506e-06, "loss": 1.614, "step": 29852 }, { "epoch": 0.82, "learning_rate": 1.7369479667747046e-06, "loss": 1.2339, "step": 29853 }, { "epoch": 0.82, "learning_rate": 1.7364498246457962e-06, "loss": 1.2952, "step": 29854 }, { "epoch": 0.82, "learning_rate": 1.7359517471670152e-06, "loss": 1.2554, "step": 29855 }, { "epoch": 0.82, "learning_rate": 1.735453734342265e-06, "loss": 1.0793, "step": 29856 }, { "epoch": 0.82, "learning_rate": 1.7349557861754373e-06, "loss": 1.3027, "step": 29857 }, { "epoch": 0.82, "learning_rate": 1.734457902670428e-06, "loss": 1.4597, "step": 29858 }, { "epoch": 0.82, "learning_rate": 1.7339600838311343e-06, "loss": 1.1924, "step": 29859 }, { "epoch": 0.82, "learning_rate": 1.7334623296614506e-06, "loss": 1.2654, "step": 29860 }, { "epoch": 0.82, "learning_rate": 1.7329646401652712e-06, "loss": 1.3521, "step": 29861 }, { "epoch": 0.82, "learning_rate": 1.732467015346485e-06, "loss": 1.2236, "step": 29862 }, { "epoch": 0.82, "learning_rate": 1.7319694552089928e-06, "loss": 1.2734, "step": 29863 }, { "epoch": 0.82, "learning_rate": 1.7314719597566843e-06, "loss": 1.2598, "step": 29864 }, { "epoch": 0.82, "learning_rate": 1.73097452899345e-06, "loss": 1.197, "step": 29865 }, { "epoch": 0.82, "learning_rate": 1.7304771629231799e-06, "loss": 1.2712, "step": 29866 }, { "epoch": 0.82, "learning_rate": 1.729979861549771e-06, "loss": 1.3838, "step": 29867 }, { "epoch": 0.82, "learning_rate": 1.7294826248771102e-06, "loss": 1.1501, "step": 29868 }, { "epoch": 0.82, "learning_rate": 1.7289854529090887e-06, "loss": 1.2693, "step": 29869 }, { "epoch": 0.82, "learning_rate": 1.7284883456495938e-06, "loss": 1.1936, "step": 29870 }, { "epoch": 0.82, "learning_rate": 1.7279913031025176e-06, "loss": 1.1406, "step": 29871 }, { "epoch": 0.82, "learning_rate": 1.7274943252717492e-06, "loss": 1.2258, "step": 29872 }, { "epoch": 0.82, "learning_rate": 1.726997412161172e-06, "loss": 1.0415, "step": 29873 }, { "epoch": 0.82, "learning_rate": 1.726500563774679e-06, "loss": 1.2463, "step": 29874 }, { "epoch": 0.82, "learning_rate": 1.7260037801161556e-06, "loss": 1.3376, "step": 29875 }, { "epoch": 0.82, "learning_rate": 1.7255070611894875e-06, "loss": 1.0271, "step": 29876 }, { "epoch": 0.82, "learning_rate": 1.7250104069985585e-06, "loss": 1.2881, "step": 29877 }, { "epoch": 0.82, "learning_rate": 1.7245138175472608e-06, "loss": 1.2878, "step": 29878 }, { "epoch": 0.82, "learning_rate": 1.7240172928394738e-06, "loss": 1.2825, "step": 29879 }, { "epoch": 0.82, "learning_rate": 1.7235208328790854e-06, "loss": 1.2512, "step": 29880 }, { "epoch": 0.82, "learning_rate": 1.7230244376699746e-06, "loss": 1.3044, "step": 29881 }, { "epoch": 0.82, "learning_rate": 1.7225281072160315e-06, "loss": 1.1052, "step": 29882 }, { "epoch": 0.82, "learning_rate": 1.7220318415211357e-06, "loss": 1.3657, "step": 29883 }, { "epoch": 0.82, "learning_rate": 1.7215356405891703e-06, "loss": 1.157, "step": 29884 }, { "epoch": 0.82, "learning_rate": 1.7210395044240146e-06, "loss": 1.3223, "step": 29885 }, { "epoch": 0.82, "learning_rate": 1.7205434330295534e-06, "loss": 1.3059, "step": 29886 }, { "epoch": 0.82, "learning_rate": 1.7200474264096723e-06, "loss": 1.2715, "step": 29887 }, { "epoch": 0.82, "learning_rate": 1.7195514845682403e-06, "loss": 1.3008, "step": 29888 }, { "epoch": 0.82, "learning_rate": 1.719055607509148e-06, "loss": 1.197, "step": 29889 }, { "epoch": 0.82, "learning_rate": 1.7185597952362664e-06, "loss": 1.1477, "step": 29890 }, { "epoch": 0.82, "learning_rate": 1.718064047753485e-06, "loss": 1.2454, "step": 29891 }, { "epoch": 0.82, "learning_rate": 1.7175683650646701e-06, "loss": 1.0571, "step": 29892 }, { "epoch": 0.82, "learning_rate": 1.7170727471737093e-06, "loss": 1.1929, "step": 29893 }, { "epoch": 0.82, "learning_rate": 1.7165771940844734e-06, "loss": 1.3091, "step": 29894 }, { "epoch": 0.82, "learning_rate": 1.7160817058008472e-06, "loss": 1.2651, "step": 29895 }, { "epoch": 0.82, "learning_rate": 1.7155862823266978e-06, "loss": 1.2056, "step": 29896 }, { "epoch": 0.82, "learning_rate": 1.7150909236659076e-06, "loss": 1.2053, "step": 29897 }, { "epoch": 0.82, "learning_rate": 1.7145956298223476e-06, "loss": 1.2881, "step": 29898 }, { "epoch": 0.82, "learning_rate": 1.7141004007999006e-06, "loss": 1.4243, "step": 29899 }, { "epoch": 0.82, "learning_rate": 1.7136052366024314e-06, "loss": 1.2522, "step": 29900 }, { "epoch": 0.82, "learning_rate": 1.7131101372338198e-06, "loss": 1.6479, "step": 29901 }, { "epoch": 0.82, "learning_rate": 1.7126151026979353e-06, "loss": 1.2629, "step": 29902 }, { "epoch": 0.82, "learning_rate": 1.712120132998656e-06, "loss": 1.3237, "step": 29903 }, { "epoch": 0.82, "learning_rate": 1.7116252281398516e-06, "loss": 1.2244, "step": 29904 }, { "epoch": 0.82, "learning_rate": 1.7111303881253915e-06, "loss": 1.2898, "step": 29905 }, { "epoch": 0.82, "learning_rate": 1.7106356129591528e-06, "loss": 1.1931, "step": 29906 }, { "epoch": 0.82, "learning_rate": 1.7101409026450021e-06, "loss": 1.2271, "step": 29907 }, { "epoch": 0.82, "learning_rate": 1.709646257186811e-06, "loss": 1.2847, "step": 29908 }, { "epoch": 0.82, "learning_rate": 1.7091516765884464e-06, "loss": 1.1948, "step": 29909 }, { "epoch": 0.82, "learning_rate": 1.7086571608537839e-06, "loss": 1.3555, "step": 29910 }, { "epoch": 0.82, "learning_rate": 1.7081627099866883e-06, "loss": 1.2278, "step": 29911 }, { "epoch": 0.82, "learning_rate": 1.7076683239910285e-06, "loss": 1.1953, "step": 29912 }, { "epoch": 0.82, "learning_rate": 1.7071740028706697e-06, "loss": 1.3069, "step": 29913 }, { "epoch": 0.82, "learning_rate": 1.706679746629485e-06, "loss": 1.3342, "step": 29914 }, { "epoch": 0.82, "learning_rate": 1.706185555271337e-06, "loss": 1.3806, "step": 29915 }, { "epoch": 0.82, "learning_rate": 1.7056914288000947e-06, "loss": 1.3154, "step": 29916 }, { "epoch": 0.82, "learning_rate": 1.7051973672196188e-06, "loss": 1.0745, "step": 29917 }, { "epoch": 0.82, "learning_rate": 1.7047033705337812e-06, "loss": 1.3467, "step": 29918 }, { "epoch": 0.82, "learning_rate": 1.7042094387464436e-06, "loss": 1.3113, "step": 29919 }, { "epoch": 0.82, "learning_rate": 1.7037155718614684e-06, "loss": 1.323, "step": 29920 }, { "epoch": 0.82, "learning_rate": 1.7032217698827237e-06, "loss": 1.0278, "step": 29921 }, { "epoch": 0.82, "learning_rate": 1.7027280328140695e-06, "loss": 1.249, "step": 29922 }, { "epoch": 0.82, "learning_rate": 1.7022343606593706e-06, "loss": 1.2256, "step": 29923 }, { "epoch": 0.82, "learning_rate": 1.701740753422485e-06, "loss": 1.2332, "step": 29924 }, { "epoch": 0.82, "learning_rate": 1.701247211107281e-06, "loss": 1.1013, "step": 29925 }, { "epoch": 0.82, "learning_rate": 1.700753733717615e-06, "loss": 1.238, "step": 29926 }, { "epoch": 0.82, "learning_rate": 1.700260321257351e-06, "loss": 1.1299, "step": 29927 }, { "epoch": 0.82, "learning_rate": 1.6997669737303435e-06, "loss": 1.3833, "step": 29928 }, { "epoch": 0.82, "learning_rate": 1.6992736911404594e-06, "loss": 1.1979, "step": 29929 }, { "epoch": 0.82, "learning_rate": 1.6987804734915548e-06, "loss": 1.323, "step": 29930 }, { "epoch": 0.82, "learning_rate": 1.6982873207874872e-06, "loss": 1.355, "step": 29931 }, { "epoch": 0.82, "learning_rate": 1.697794233032114e-06, "loss": 1.26, "step": 29932 }, { "epoch": 0.82, "learning_rate": 1.6973012102292952e-06, "loss": 1.1489, "step": 29933 }, { "epoch": 0.82, "learning_rate": 1.6968082523828922e-06, "loss": 1.1453, "step": 29934 }, { "epoch": 0.82, "learning_rate": 1.6963153594967519e-06, "loss": 1.2195, "step": 29935 }, { "epoch": 0.82, "learning_rate": 1.695822531574738e-06, "loss": 1.0647, "step": 29936 }, { "epoch": 0.82, "learning_rate": 1.6953297686207016e-06, "loss": 1.2441, "step": 29937 }, { "epoch": 0.82, "learning_rate": 1.6948370706385043e-06, "loss": 1.3132, "step": 29938 }, { "epoch": 0.82, "learning_rate": 1.6943444376319918e-06, "loss": 1.2507, "step": 29939 }, { "epoch": 0.82, "learning_rate": 1.6938518696050255e-06, "loss": 1.3215, "step": 29940 }, { "epoch": 0.82, "learning_rate": 1.6933593665614534e-06, "loss": 1.2539, "step": 29941 }, { "epoch": 0.82, "learning_rate": 1.6928669285051368e-06, "loss": 1.3193, "step": 29942 }, { "epoch": 0.82, "learning_rate": 1.6923745554399184e-06, "loss": 1.3811, "step": 29943 }, { "epoch": 0.82, "learning_rate": 1.6918822473696572e-06, "loss": 1.188, "step": 29944 }, { "epoch": 0.82, "learning_rate": 1.6913900042982e-06, "loss": 1.3518, "step": 29945 }, { "epoch": 0.82, "learning_rate": 1.690897826229405e-06, "loss": 1.1987, "step": 29946 }, { "epoch": 0.82, "learning_rate": 1.6904057131671137e-06, "loss": 1.355, "step": 29947 }, { "epoch": 0.82, "learning_rate": 1.6899136651151804e-06, "loss": 1.2173, "step": 29948 }, { "epoch": 0.82, "learning_rate": 1.6894216820774577e-06, "loss": 1.3445, "step": 29949 }, { "epoch": 0.82, "learning_rate": 1.6889297640577918e-06, "loss": 1.248, "step": 29950 }, { "epoch": 0.82, "learning_rate": 1.6884379110600313e-06, "loss": 1.2334, "step": 29951 }, { "epoch": 0.82, "learning_rate": 1.6879461230880212e-06, "loss": 1.3477, "step": 29952 }, { "epoch": 0.82, "learning_rate": 1.687454400145615e-06, "loss": 1.116, "step": 29953 }, { "epoch": 0.82, "learning_rate": 1.6869627422366575e-06, "loss": 1.3923, "step": 29954 }, { "epoch": 0.82, "learning_rate": 1.6864711493649932e-06, "loss": 1.2808, "step": 29955 }, { "epoch": 0.82, "learning_rate": 1.6859796215344671e-06, "loss": 1.2578, "step": 29956 }, { "epoch": 0.82, "learning_rate": 1.6854881587489303e-06, "loss": 1.2275, "step": 29957 }, { "epoch": 0.82, "learning_rate": 1.684996761012223e-06, "loss": 1.1951, "step": 29958 }, { "epoch": 0.82, "learning_rate": 1.6845054283281915e-06, "loss": 1.2876, "step": 29959 }, { "epoch": 0.82, "learning_rate": 1.6840141607006777e-06, "loss": 1.2629, "step": 29960 }, { "epoch": 0.82, "learning_rate": 1.6835229581335277e-06, "loss": 1.3379, "step": 29961 }, { "epoch": 0.82, "learning_rate": 1.683031820630584e-06, "loss": 1.2871, "step": 29962 }, { "epoch": 0.82, "learning_rate": 1.682540748195689e-06, "loss": 1.342, "step": 29963 }, { "epoch": 0.82, "learning_rate": 1.6820497408326808e-06, "loss": 1.3474, "step": 29964 }, { "epoch": 0.82, "learning_rate": 1.6815587985454074e-06, "loss": 1.3943, "step": 29965 }, { "epoch": 0.82, "learning_rate": 1.6810679213377058e-06, "loss": 1.189, "step": 29966 }, { "epoch": 0.82, "learning_rate": 1.680577109213415e-06, "loss": 1.3123, "step": 29967 }, { "epoch": 0.82, "learning_rate": 1.6800863621763786e-06, "loss": 1.2478, "step": 29968 }, { "epoch": 0.82, "learning_rate": 1.6795956802304336e-06, "loss": 1.1174, "step": 29969 }, { "epoch": 0.82, "learning_rate": 1.6791050633794204e-06, "loss": 1.281, "step": 29970 }, { "epoch": 0.82, "learning_rate": 1.6786145116271747e-06, "loss": 1.2566, "step": 29971 }, { "epoch": 0.82, "learning_rate": 1.6781240249775376e-06, "loss": 1.2078, "step": 29972 }, { "epoch": 0.82, "learning_rate": 1.6776336034343444e-06, "loss": 1.2261, "step": 29973 }, { "epoch": 0.82, "learning_rate": 1.6771432470014326e-06, "loss": 1.3362, "step": 29974 }, { "epoch": 0.82, "learning_rate": 1.6766529556826373e-06, "loss": 1.3662, "step": 29975 }, { "epoch": 0.82, "learning_rate": 1.676162729481796e-06, "loss": 1.1326, "step": 29976 }, { "epoch": 0.82, "learning_rate": 1.6756725684027442e-06, "loss": 1.2981, "step": 29977 }, { "epoch": 0.82, "learning_rate": 1.675182472449316e-06, "loss": 1.238, "step": 29978 }, { "epoch": 0.82, "learning_rate": 1.6746924416253429e-06, "loss": 1.1982, "step": 29979 }, { "epoch": 0.82, "learning_rate": 1.674202475934662e-06, "loss": 1.1274, "step": 29980 }, { "epoch": 0.82, "learning_rate": 1.6737125753811101e-06, "loss": 1.29, "step": 29981 }, { "epoch": 0.82, "learning_rate": 1.6732227399685107e-06, "loss": 1.3506, "step": 29982 }, { "epoch": 0.82, "learning_rate": 1.6727329697007033e-06, "loss": 1.3254, "step": 29983 }, { "epoch": 0.82, "learning_rate": 1.6722432645815157e-06, "loss": 1.3066, "step": 29984 }, { "epoch": 0.82, "learning_rate": 1.6717536246147826e-06, "loss": 1.2185, "step": 29985 }, { "epoch": 0.82, "learning_rate": 1.671264049804333e-06, "loss": 1.0706, "step": 29986 }, { "epoch": 0.82, "learning_rate": 1.6707745401539964e-06, "loss": 1.7083, "step": 29987 }, { "epoch": 0.82, "learning_rate": 1.670285095667602e-06, "loss": 1.1335, "step": 29988 }, { "epoch": 0.82, "learning_rate": 1.669795716348982e-06, "loss": 1.3567, "step": 29989 }, { "epoch": 0.82, "learning_rate": 1.6693064022019633e-06, "loss": 1.2231, "step": 29990 }, { "epoch": 0.82, "learning_rate": 1.6688171532303731e-06, "loss": 1.1404, "step": 29991 }, { "epoch": 0.82, "learning_rate": 1.6683279694380383e-06, "loss": 1.2734, "step": 29992 }, { "epoch": 0.82, "learning_rate": 1.6678388508287902e-06, "loss": 1.2354, "step": 29993 }, { "epoch": 0.82, "learning_rate": 1.6673497974064524e-06, "loss": 1.6851, "step": 29994 }, { "epoch": 0.82, "learning_rate": 1.6668608091748495e-06, "loss": 1.4023, "step": 29995 }, { "epoch": 0.82, "learning_rate": 1.666371886137811e-06, "loss": 1.2639, "step": 29996 }, { "epoch": 0.82, "learning_rate": 1.665883028299161e-06, "loss": 1.2861, "step": 29997 }, { "epoch": 0.82, "learning_rate": 1.665394235662723e-06, "loss": 1.2322, "step": 29998 }, { "epoch": 0.82, "learning_rate": 1.6649055082323185e-06, "loss": 1.3313, "step": 29999 }, { "epoch": 0.82, "learning_rate": 1.664416846011776e-06, "loss": 1.1819, "step": 30000 }, { "epoch": 0.82, "learning_rate": 1.663928249004917e-06, "loss": 1.386, "step": 30001 }, { "epoch": 0.82, "learning_rate": 1.6634397172155625e-06, "loss": 1.2761, "step": 30002 }, { "epoch": 0.82, "learning_rate": 1.6629512506475342e-06, "loss": 1.1362, "step": 30003 }, { "epoch": 0.82, "learning_rate": 1.6624628493046568e-06, "loss": 1.1689, "step": 30004 }, { "epoch": 0.82, "learning_rate": 1.6619745131907494e-06, "loss": 1.2935, "step": 30005 }, { "epoch": 0.82, "learning_rate": 1.6614862423096335e-06, "loss": 1.4443, "step": 30006 }, { "epoch": 0.82, "learning_rate": 1.6609980366651245e-06, "loss": 1.324, "step": 30007 }, { "epoch": 0.82, "learning_rate": 1.660509896261049e-06, "loss": 1.1316, "step": 30008 }, { "epoch": 0.82, "learning_rate": 1.660021821101222e-06, "loss": 1.2954, "step": 30009 }, { "epoch": 0.82, "learning_rate": 1.65953381118946e-06, "loss": 1.2112, "step": 30010 }, { "epoch": 0.82, "learning_rate": 1.6590458665295873e-06, "loss": 1.2424, "step": 30011 }, { "epoch": 0.82, "learning_rate": 1.6585579871254154e-06, "loss": 1.3608, "step": 30012 }, { "epoch": 0.82, "learning_rate": 1.6580701729807647e-06, "loss": 1.2239, "step": 30013 }, { "epoch": 0.82, "learning_rate": 1.6575824240994476e-06, "loss": 1.3779, "step": 30014 }, { "epoch": 0.82, "learning_rate": 1.6570947404852855e-06, "loss": 1.2046, "step": 30015 }, { "epoch": 0.82, "learning_rate": 1.6566071221420887e-06, "loss": 1.3499, "step": 30016 }, { "epoch": 0.82, "learning_rate": 1.6561195690736786e-06, "loss": 1.196, "step": 30017 }, { "epoch": 0.82, "learning_rate": 1.6556320812838612e-06, "loss": 1.2249, "step": 30018 }, { "epoch": 0.82, "learning_rate": 1.6551446587764563e-06, "loss": 1.3755, "step": 30019 }, { "epoch": 0.82, "learning_rate": 1.6546573015552735e-06, "loss": 1.3091, "step": 30020 }, { "epoch": 0.82, "learning_rate": 1.6541700096241332e-06, "loss": 1.2141, "step": 30021 }, { "epoch": 0.82, "learning_rate": 1.6536827829868363e-06, "loss": 1.188, "step": 30022 }, { "epoch": 0.82, "learning_rate": 1.6531956216472035e-06, "loss": 1.2795, "step": 30023 }, { "epoch": 0.82, "learning_rate": 1.6527085256090414e-06, "loss": 1.2766, "step": 30024 }, { "epoch": 0.82, "learning_rate": 1.6522214948761671e-06, "loss": 1.3059, "step": 30025 }, { "epoch": 0.82, "learning_rate": 1.6517345294523812e-06, "loss": 1.3115, "step": 30026 }, { "epoch": 0.82, "learning_rate": 1.6512476293414992e-06, "loss": 1.2751, "step": 30027 }, { "epoch": 0.82, "learning_rate": 1.6507607945473313e-06, "loss": 1.1721, "step": 30028 }, { "epoch": 0.82, "learning_rate": 1.650274025073686e-06, "loss": 1.3926, "step": 30029 }, { "epoch": 0.82, "learning_rate": 1.6497873209243698e-06, "loss": 1.2971, "step": 30030 }, { "epoch": 0.82, "learning_rate": 1.6493006821031887e-06, "loss": 1.3665, "step": 30031 }, { "epoch": 0.82, "learning_rate": 1.6488141086139552e-06, "loss": 1.3665, "step": 30032 }, { "epoch": 0.82, "learning_rate": 1.648327600460472e-06, "loss": 1.304, "step": 30033 }, { "epoch": 0.82, "learning_rate": 1.6478411576465481e-06, "loss": 1.2014, "step": 30034 }, { "epoch": 0.82, "learning_rate": 1.6473547801759838e-06, "loss": 1.3013, "step": 30035 }, { "epoch": 0.82, "learning_rate": 1.6468684680525904e-06, "loss": 1.1028, "step": 30036 }, { "epoch": 0.82, "learning_rate": 1.6463822212801706e-06, "loss": 1.2761, "step": 30037 }, { "epoch": 0.82, "learning_rate": 1.645896039862529e-06, "loss": 1.1602, "step": 30038 }, { "epoch": 0.82, "learning_rate": 1.6454099238034648e-06, "loss": 1.3264, "step": 30039 }, { "epoch": 0.82, "learning_rate": 1.6449238731067874e-06, "loss": 1.24, "step": 30040 }, { "epoch": 0.82, "learning_rate": 1.6444378877762968e-06, "loss": 1.2947, "step": 30041 }, { "epoch": 0.82, "learning_rate": 1.6439519678157922e-06, "loss": 1.314, "step": 30042 }, { "epoch": 0.82, "learning_rate": 1.643466113229082e-06, "loss": 1.3149, "step": 30043 }, { "epoch": 0.82, "learning_rate": 1.6429803240199626e-06, "loss": 1.2607, "step": 30044 }, { "epoch": 0.82, "learning_rate": 1.6424946001922348e-06, "loss": 1.3037, "step": 30045 }, { "epoch": 0.82, "learning_rate": 1.6420089417496977e-06, "loss": 1.188, "step": 30046 }, { "epoch": 0.82, "learning_rate": 1.6415233486961546e-06, "loss": 1.2937, "step": 30047 }, { "epoch": 0.82, "learning_rate": 1.6410378210354017e-06, "loss": 1.2998, "step": 30048 }, { "epoch": 0.82, "learning_rate": 1.6405523587712392e-06, "loss": 1.1077, "step": 30049 }, { "epoch": 0.82, "learning_rate": 1.6400669619074616e-06, "loss": 1.1343, "step": 30050 }, { "epoch": 0.82, "learning_rate": 1.6395816304478706e-06, "loss": 1.2662, "step": 30051 }, { "epoch": 0.82, "learning_rate": 1.639096364396262e-06, "loss": 1.2549, "step": 30052 }, { "epoch": 0.82, "learning_rate": 1.6386111637564328e-06, "loss": 1.1685, "step": 30053 }, { "epoch": 0.82, "learning_rate": 1.6381260285321743e-06, "loss": 1.3977, "step": 30054 }, { "epoch": 0.82, "learning_rate": 1.637640958727289e-06, "loss": 1.2234, "step": 30055 }, { "epoch": 0.82, "learning_rate": 1.6371559543455683e-06, "loss": 1.231, "step": 30056 }, { "epoch": 0.82, "learning_rate": 1.6366710153908038e-06, "loss": 1.2832, "step": 30057 }, { "epoch": 0.82, "learning_rate": 1.6361861418667956e-06, "loss": 1.1853, "step": 30058 }, { "epoch": 0.82, "learning_rate": 1.635701333777332e-06, "loss": 1.3992, "step": 30059 }, { "epoch": 0.82, "learning_rate": 1.635216591126213e-06, "loss": 1.2085, "step": 30060 }, { "epoch": 0.82, "learning_rate": 1.6347319139172202e-06, "loss": 1.2227, "step": 30061 }, { "epoch": 0.82, "learning_rate": 1.634247302154155e-06, "loss": 1.2871, "step": 30062 }, { "epoch": 0.82, "learning_rate": 1.633762755840801e-06, "loss": 1.8066, "step": 30063 }, { "epoch": 0.82, "learning_rate": 1.6332782749809595e-06, "loss": 1.3081, "step": 30064 }, { "epoch": 0.82, "learning_rate": 1.6327938595784086e-06, "loss": 1.2473, "step": 30065 }, { "epoch": 0.82, "learning_rate": 1.6323095096369469e-06, "loss": 1.3162, "step": 30066 }, { "epoch": 0.82, "learning_rate": 1.6318252251603583e-06, "loss": 1.167, "step": 30067 }, { "epoch": 0.82, "learning_rate": 1.6313410061524393e-06, "loss": 1.2695, "step": 30068 }, { "epoch": 0.82, "learning_rate": 1.6308568526169677e-06, "loss": 1.1045, "step": 30069 }, { "epoch": 0.82, "learning_rate": 1.6303727645577394e-06, "loss": 1.3513, "step": 30070 }, { "epoch": 0.82, "learning_rate": 1.6298887419785358e-06, "loss": 1.2034, "step": 30071 }, { "epoch": 0.82, "learning_rate": 1.6294047848831496e-06, "loss": 1.0625, "step": 30072 }, { "epoch": 0.82, "learning_rate": 1.6289208932753641e-06, "loss": 1.3535, "step": 30073 }, { "epoch": 0.82, "learning_rate": 1.6284370671589634e-06, "loss": 1.1406, "step": 30074 }, { "epoch": 0.82, "learning_rate": 1.6279533065377363e-06, "loss": 1.3032, "step": 30075 }, { "epoch": 0.82, "learning_rate": 1.6274696114154663e-06, "loss": 1.2102, "step": 30076 }, { "epoch": 0.82, "learning_rate": 1.6269859817959367e-06, "loss": 1.4375, "step": 30077 }, { "epoch": 0.82, "learning_rate": 1.6265024176829292e-06, "loss": 1.2722, "step": 30078 }, { "epoch": 0.82, "learning_rate": 1.626018919080231e-06, "loss": 1.311, "step": 30079 }, { "epoch": 0.82, "learning_rate": 1.6255354859916238e-06, "loss": 1.2502, "step": 30080 }, { "epoch": 0.82, "learning_rate": 1.625052118420889e-06, "loss": 1.3047, "step": 30081 }, { "epoch": 0.82, "learning_rate": 1.6245688163718054e-06, "loss": 1.2184, "step": 30082 }, { "epoch": 0.82, "learning_rate": 1.6240855798481603e-06, "loss": 1.2567, "step": 30083 }, { "epoch": 0.82, "learning_rate": 1.6236024088537294e-06, "loss": 1.1418, "step": 30084 }, { "epoch": 0.82, "learning_rate": 1.6231193033922955e-06, "loss": 1.3379, "step": 30085 }, { "epoch": 0.82, "learning_rate": 1.6226362634676351e-06, "loss": 1.748, "step": 30086 }, { "epoch": 0.82, "learning_rate": 1.6221532890835312e-06, "loss": 1.2634, "step": 30087 }, { "epoch": 0.82, "learning_rate": 1.6216703802437593e-06, "loss": 1.1042, "step": 30088 }, { "epoch": 0.82, "learning_rate": 1.621187536952098e-06, "loss": 1.3975, "step": 30089 }, { "epoch": 0.82, "learning_rate": 1.620704759212327e-06, "loss": 1.2693, "step": 30090 }, { "epoch": 0.82, "learning_rate": 1.6202220470282214e-06, "loss": 1.2581, "step": 30091 }, { "epoch": 0.82, "learning_rate": 1.6197394004035582e-06, "loss": 1.2925, "step": 30092 }, { "epoch": 0.82, "learning_rate": 1.619256819342111e-06, "loss": 1.3818, "step": 30093 }, { "epoch": 0.82, "learning_rate": 1.6187743038476599e-06, "loss": 1.1631, "step": 30094 }, { "epoch": 0.82, "learning_rate": 1.6182918539239779e-06, "loss": 1.1201, "step": 30095 }, { "epoch": 0.82, "learning_rate": 1.6178094695748393e-06, "loss": 1.2422, "step": 30096 }, { "epoch": 0.82, "learning_rate": 1.6173271508040144e-06, "loss": 1.3552, "step": 30097 }, { "epoch": 0.82, "learning_rate": 1.6168448976152829e-06, "loss": 1.3176, "step": 30098 }, { "epoch": 0.82, "learning_rate": 1.6163627100124147e-06, "loss": 1.3477, "step": 30099 }, { "epoch": 0.82, "learning_rate": 1.6158805879991834e-06, "loss": 1.1531, "step": 30100 }, { "epoch": 0.82, "learning_rate": 1.6153985315793562e-06, "loss": 1.2273, "step": 30101 }, { "epoch": 0.82, "learning_rate": 1.6149165407567113e-06, "loss": 1.2832, "step": 30102 }, { "epoch": 0.82, "learning_rate": 1.6144346155350166e-06, "loss": 1.3533, "step": 30103 }, { "epoch": 0.82, "learning_rate": 1.613952755918039e-06, "loss": 1.218, "step": 30104 }, { "epoch": 0.82, "learning_rate": 1.6134709619095545e-06, "loss": 1.2258, "step": 30105 }, { "epoch": 0.82, "learning_rate": 1.6129892335133279e-06, "loss": 1.3179, "step": 30106 }, { "epoch": 0.82, "learning_rate": 1.6125075707331339e-06, "loss": 1.1631, "step": 30107 }, { "epoch": 0.82, "learning_rate": 1.6120259735727318e-06, "loss": 1.3191, "step": 30108 }, { "epoch": 0.82, "learning_rate": 1.6115444420358962e-06, "loss": 1.2954, "step": 30109 }, { "epoch": 0.82, "learning_rate": 1.6110629761263897e-06, "loss": 1.2871, "step": 30110 }, { "epoch": 0.82, "learning_rate": 1.610581575847987e-06, "loss": 1.3013, "step": 30111 }, { "epoch": 0.82, "learning_rate": 1.6101002412044454e-06, "loss": 1.1731, "step": 30112 }, { "epoch": 0.82, "learning_rate": 1.6096189721995347e-06, "loss": 1.366, "step": 30113 }, { "epoch": 0.82, "learning_rate": 1.609137768837019e-06, "loss": 1.3757, "step": 30114 }, { "epoch": 0.82, "learning_rate": 1.6086566311206675e-06, "loss": 1.241, "step": 30115 }, { "epoch": 0.82, "learning_rate": 1.6081755590542358e-06, "loss": 1.2571, "step": 30116 }, { "epoch": 0.82, "learning_rate": 1.6076945526414955e-06, "loss": 1.6719, "step": 30117 }, { "epoch": 0.82, "learning_rate": 1.6072136118862035e-06, "loss": 1.1624, "step": 30118 }, { "epoch": 0.82, "learning_rate": 1.6067327367921293e-06, "loss": 1.2808, "step": 30119 }, { "epoch": 0.82, "learning_rate": 1.6062519273630307e-06, "loss": 1.2258, "step": 30120 }, { "epoch": 0.82, "learning_rate": 1.6057711836026668e-06, "loss": 1.28, "step": 30121 }, { "epoch": 0.82, "learning_rate": 1.605290505514805e-06, "loss": 1.3115, "step": 30122 }, { "epoch": 0.82, "learning_rate": 1.604809893103203e-06, "loss": 1.2844, "step": 30123 }, { "epoch": 0.82, "learning_rate": 1.6043293463716202e-06, "loss": 1.3948, "step": 30124 }, { "epoch": 0.82, "learning_rate": 1.6038488653238149e-06, "loss": 1.0552, "step": 30125 }, { "epoch": 0.82, "learning_rate": 1.6033684499635504e-06, "loss": 1.2874, "step": 30126 }, { "epoch": 0.82, "learning_rate": 1.6028881002945817e-06, "loss": 1.2817, "step": 30127 }, { "epoch": 0.82, "learning_rate": 1.6024078163206692e-06, "loss": 1.3058, "step": 30128 }, { "epoch": 0.82, "learning_rate": 1.6019275980455662e-06, "loss": 1.3191, "step": 30129 }, { "epoch": 0.82, "learning_rate": 1.6014474454730345e-06, "loss": 1.2688, "step": 30130 }, { "epoch": 0.82, "learning_rate": 1.6009673586068286e-06, "loss": 1.2412, "step": 30131 }, { "epoch": 0.82, "learning_rate": 1.6004873374507057e-06, "loss": 1.1342, "step": 30132 }, { "epoch": 0.82, "learning_rate": 1.6000073820084172e-06, "loss": 1.2419, "step": 30133 }, { "epoch": 0.82, "learning_rate": 1.5995274922837233e-06, "loss": 1.2898, "step": 30134 }, { "epoch": 0.82, "learning_rate": 1.5990476682803757e-06, "loss": 1.1165, "step": 30135 }, { "epoch": 0.82, "learning_rate": 1.5985679100021268e-06, "loss": 1.2021, "step": 30136 }, { "epoch": 0.82, "learning_rate": 1.5980882174527346e-06, "loss": 1.3523, "step": 30137 }, { "epoch": 0.82, "learning_rate": 1.5976085906359496e-06, "loss": 1.2466, "step": 30138 }, { "epoch": 0.82, "learning_rate": 1.597129029555523e-06, "loss": 1.3018, "step": 30139 }, { "epoch": 0.82, "learning_rate": 1.5966495342152054e-06, "loss": 1.1328, "step": 30140 }, { "epoch": 0.82, "learning_rate": 1.5961701046187527e-06, "loss": 1.4424, "step": 30141 }, { "epoch": 0.82, "learning_rate": 1.595690740769914e-06, "loss": 1.2598, "step": 30142 }, { "epoch": 0.82, "learning_rate": 1.5952114426724385e-06, "loss": 1.4082, "step": 30143 }, { "epoch": 0.82, "learning_rate": 1.5947322103300734e-06, "loss": 1.4106, "step": 30144 }, { "epoch": 0.82, "learning_rate": 1.5942530437465742e-06, "loss": 1.1484, "step": 30145 }, { "epoch": 0.82, "learning_rate": 1.5937739429256872e-06, "loss": 1.6392, "step": 30146 }, { "epoch": 0.82, "learning_rate": 1.593294907871159e-06, "loss": 1.2922, "step": 30147 }, { "epoch": 0.82, "learning_rate": 1.592815938586736e-06, "loss": 1.4067, "step": 30148 }, { "epoch": 0.82, "learning_rate": 1.5923370350761703e-06, "loss": 1.325, "step": 30149 }, { "epoch": 0.82, "learning_rate": 1.5918581973432057e-06, "loss": 1.1992, "step": 30150 }, { "epoch": 0.82, "learning_rate": 1.591379425391587e-06, "loss": 1.4338, "step": 30151 }, { "epoch": 0.82, "learning_rate": 1.5909007192250637e-06, "loss": 1.271, "step": 30152 }, { "epoch": 0.82, "learning_rate": 1.5904220788473767e-06, "loss": 1.3691, "step": 30153 }, { "epoch": 0.82, "learning_rate": 1.5899435042622768e-06, "loss": 1.2239, "step": 30154 }, { "epoch": 0.82, "learning_rate": 1.589464995473501e-06, "loss": 1.1362, "step": 30155 }, { "epoch": 0.82, "learning_rate": 1.5889865524847981e-06, "loss": 1.3506, "step": 30156 }, { "epoch": 0.82, "learning_rate": 1.5885081752999064e-06, "loss": 1.3333, "step": 30157 }, { "epoch": 0.82, "learning_rate": 1.5880298639225765e-06, "loss": 1.1953, "step": 30158 }, { "epoch": 0.82, "learning_rate": 1.5875516183565398e-06, "loss": 1.1535, "step": 30159 }, { "epoch": 0.82, "learning_rate": 1.5870734386055464e-06, "loss": 1.2244, "step": 30160 }, { "epoch": 0.82, "learning_rate": 1.5865953246733323e-06, "loss": 1.2639, "step": 30161 }, { "epoch": 0.82, "learning_rate": 1.5861172765636447e-06, "loss": 1.3938, "step": 30162 }, { "epoch": 0.82, "learning_rate": 1.5856392942802145e-06, "loss": 1.2893, "step": 30163 }, { "epoch": 0.82, "learning_rate": 1.5851613778267872e-06, "loss": 1.2705, "step": 30164 }, { "epoch": 0.82, "learning_rate": 1.5846835272070992e-06, "loss": 1.1487, "step": 30165 }, { "epoch": 0.82, "learning_rate": 1.5842057424248913e-06, "loss": 1.3318, "step": 30166 }, { "epoch": 0.82, "learning_rate": 1.5837280234839013e-06, "loss": 1.2507, "step": 30167 }, { "epoch": 0.82, "learning_rate": 1.5832503703878633e-06, "loss": 1.2153, "step": 30168 }, { "epoch": 0.82, "learning_rate": 1.5827727831405183e-06, "loss": 1.1824, "step": 30169 }, { "epoch": 0.82, "learning_rate": 1.5822952617456011e-06, "loss": 1.2545, "step": 30170 }, { "epoch": 0.82, "learning_rate": 1.5818178062068478e-06, "loss": 1.1654, "step": 30171 }, { "epoch": 0.82, "learning_rate": 1.58134041652799e-06, "loss": 1.2561, "step": 30172 }, { "epoch": 0.82, "learning_rate": 1.5808630927127699e-06, "loss": 1.2114, "step": 30173 }, { "epoch": 0.82, "learning_rate": 1.580385834764917e-06, "loss": 1.3066, "step": 30174 }, { "epoch": 0.82, "learning_rate": 1.5799086426881672e-06, "loss": 1.7334, "step": 30175 }, { "epoch": 0.82, "learning_rate": 1.5794315164862495e-06, "loss": 1.1548, "step": 30176 }, { "epoch": 0.82, "learning_rate": 1.5789544561629022e-06, "loss": 1.1687, "step": 30177 }, { "epoch": 0.82, "learning_rate": 1.5784774617218558e-06, "loss": 1.2231, "step": 30178 }, { "epoch": 0.82, "learning_rate": 1.5780005331668425e-06, "loss": 1.238, "step": 30179 }, { "epoch": 0.82, "learning_rate": 1.5775236705015894e-06, "loss": 1.2236, "step": 30180 }, { "epoch": 0.82, "learning_rate": 1.5770468737298328e-06, "loss": 1.0872, "step": 30181 }, { "epoch": 0.82, "learning_rate": 1.5765701428553004e-06, "loss": 1.345, "step": 30182 }, { "epoch": 0.82, "learning_rate": 1.5760934778817204e-06, "loss": 1.3074, "step": 30183 }, { "epoch": 0.82, "learning_rate": 1.5756168788128268e-06, "loss": 1.2732, "step": 30184 }, { "epoch": 0.82, "learning_rate": 1.575140345652345e-06, "loss": 1.2827, "step": 30185 }, { "epoch": 0.82, "learning_rate": 1.5746638784040025e-06, "loss": 1.2679, "step": 30186 }, { "epoch": 0.82, "learning_rate": 1.5741874770715272e-06, "loss": 1.3071, "step": 30187 }, { "epoch": 0.82, "learning_rate": 1.573711141658648e-06, "loss": 1.3157, "step": 30188 }, { "epoch": 0.82, "learning_rate": 1.5732348721690903e-06, "loss": 1.1199, "step": 30189 }, { "epoch": 0.82, "learning_rate": 1.572758668606582e-06, "loss": 1.3538, "step": 30190 }, { "epoch": 0.82, "learning_rate": 1.5722825309748436e-06, "loss": 1.1958, "step": 30191 }, { "epoch": 0.82, "learning_rate": 1.5718064592776061e-06, "loss": 1.2593, "step": 30192 }, { "epoch": 0.82, "learning_rate": 1.5713304535185914e-06, "loss": 1.3755, "step": 30193 }, { "epoch": 0.82, "learning_rate": 1.570854513701525e-06, "loss": 1.4292, "step": 30194 }, { "epoch": 0.82, "learning_rate": 1.5703786398301257e-06, "loss": 1.2355, "step": 30195 }, { "epoch": 0.82, "learning_rate": 1.56990283190812e-06, "loss": 1.2217, "step": 30196 }, { "epoch": 0.82, "learning_rate": 1.5694270899392362e-06, "loss": 1.2695, "step": 30197 }, { "epoch": 0.82, "learning_rate": 1.5689514139271855e-06, "loss": 1.1643, "step": 30198 }, { "epoch": 0.82, "learning_rate": 1.5684758038756964e-06, "loss": 1.271, "step": 30199 }, { "epoch": 0.82, "learning_rate": 1.5680002597884846e-06, "loss": 1.3096, "step": 30200 }, { "epoch": 0.82, "learning_rate": 1.5675247816692795e-06, "loss": 1.3503, "step": 30201 }, { "epoch": 0.82, "learning_rate": 1.5670493695217903e-06, "loss": 1.1624, "step": 30202 }, { "epoch": 0.82, "learning_rate": 1.566574023349744e-06, "loss": 1.1809, "step": 30203 }, { "epoch": 0.82, "learning_rate": 1.5660987431568541e-06, "loss": 1.1182, "step": 30204 }, { "epoch": 0.82, "learning_rate": 1.5656235289468468e-06, "loss": 1.2307, "step": 30205 }, { "epoch": 0.82, "learning_rate": 1.5651483807234303e-06, "loss": 1.2668, "step": 30206 }, { "epoch": 0.82, "learning_rate": 1.564673298490329e-06, "loss": 1.2729, "step": 30207 }, { "epoch": 0.82, "learning_rate": 1.5641982822512546e-06, "loss": 1.2834, "step": 30208 }, { "epoch": 0.82, "learning_rate": 1.563723332009931e-06, "loss": 1.0837, "step": 30209 }, { "epoch": 0.83, "learning_rate": 1.5632484477700637e-06, "loss": 1.1323, "step": 30210 }, { "epoch": 0.83, "learning_rate": 1.5627736295353757e-06, "loss": 1.3005, "step": 30211 }, { "epoch": 0.83, "learning_rate": 1.562298877309577e-06, "loss": 1.1089, "step": 30212 }, { "epoch": 0.83, "learning_rate": 1.5618241910963873e-06, "loss": 1.3345, "step": 30213 }, { "epoch": 0.83, "learning_rate": 1.5613495708995164e-06, "loss": 1.1848, "step": 30214 }, { "epoch": 0.83, "learning_rate": 1.560875016722676e-06, "loss": 1.2031, "step": 30215 }, { "epoch": 0.83, "learning_rate": 1.5604005285695845e-06, "loss": 1.145, "step": 30216 }, { "epoch": 0.83, "learning_rate": 1.5599261064439498e-06, "loss": 1.2065, "step": 30217 }, { "epoch": 0.83, "learning_rate": 1.5594517503494845e-06, "loss": 1.2242, "step": 30218 }, { "epoch": 0.83, "learning_rate": 1.5589774602898977e-06, "loss": 1.4053, "step": 30219 }, { "epoch": 0.83, "learning_rate": 1.5585032362689045e-06, "loss": 1.2397, "step": 30220 }, { "epoch": 0.83, "learning_rate": 1.5580290782902119e-06, "loss": 1.0991, "step": 30221 }, { "epoch": 0.83, "learning_rate": 1.5575549863575302e-06, "loss": 1.3049, "step": 30222 }, { "epoch": 0.83, "learning_rate": 1.5570809604745661e-06, "loss": 1.3596, "step": 30223 }, { "epoch": 0.83, "learning_rate": 1.556607000645033e-06, "loss": 1.1489, "step": 30224 }, { "epoch": 0.83, "learning_rate": 1.556133106872636e-06, "loss": 1.0996, "step": 30225 }, { "epoch": 0.83, "learning_rate": 1.5556592791610836e-06, "loss": 1.6792, "step": 30226 }, { "epoch": 0.83, "learning_rate": 1.5551855175140785e-06, "loss": 1.1865, "step": 30227 }, { "epoch": 0.83, "learning_rate": 1.5547118219353341e-06, "loss": 1.6548, "step": 30228 }, { "epoch": 0.83, "learning_rate": 1.5542381924285533e-06, "loss": 1.3193, "step": 30229 }, { "epoch": 0.83, "learning_rate": 1.5537646289974396e-06, "loss": 1.2078, "step": 30230 }, { "epoch": 0.83, "learning_rate": 1.5532911316457012e-06, "loss": 1.2573, "step": 30231 }, { "epoch": 0.83, "learning_rate": 1.5528177003770417e-06, "loss": 1.239, "step": 30232 }, { "epoch": 0.83, "learning_rate": 1.552344335195164e-06, "loss": 1.166, "step": 30233 }, { "epoch": 0.83, "learning_rate": 1.5518710361037693e-06, "loss": 1.3003, "step": 30234 }, { "epoch": 0.83, "learning_rate": 1.5513978031065657e-06, "loss": 1.4111, "step": 30235 }, { "epoch": 0.83, "learning_rate": 1.5509246362072527e-06, "loss": 1.178, "step": 30236 }, { "epoch": 0.83, "learning_rate": 1.5504515354095318e-06, "loss": 1.3252, "step": 30237 }, { "epoch": 0.83, "learning_rate": 1.549978500717103e-06, "loss": 1.0812, "step": 30238 }, { "epoch": 0.83, "learning_rate": 1.5495055321336716e-06, "loss": 1.4189, "step": 30239 }, { "epoch": 0.83, "learning_rate": 1.5490326296629344e-06, "loss": 1.3308, "step": 30240 }, { "epoch": 0.83, "learning_rate": 1.5485597933085928e-06, "loss": 1.1287, "step": 30241 }, { "epoch": 0.83, "learning_rate": 1.5480870230743427e-06, "loss": 1.3667, "step": 30242 }, { "epoch": 0.83, "learning_rate": 1.5476143189638848e-06, "loss": 1.3064, "step": 30243 }, { "epoch": 0.83, "learning_rate": 1.5471416809809236e-06, "loss": 1.1956, "step": 30244 }, { "epoch": 0.83, "learning_rate": 1.5466691091291452e-06, "loss": 1.3228, "step": 30245 }, { "epoch": 0.83, "learning_rate": 1.5461966034122556e-06, "loss": 1.2102, "step": 30246 }, { "epoch": 0.83, "learning_rate": 1.545724163833946e-06, "loss": 1.1472, "step": 30247 }, { "epoch": 0.83, "learning_rate": 1.5452517903979182e-06, "loss": 1.2803, "step": 30248 }, { "epoch": 0.83, "learning_rate": 1.5447794831078644e-06, "loss": 1.2019, "step": 30249 }, { "epoch": 0.83, "learning_rate": 1.5443072419674788e-06, "loss": 1.1881, "step": 30250 }, { "epoch": 0.83, "learning_rate": 1.5438350669804558e-06, "loss": 1.1804, "step": 30251 }, { "epoch": 0.83, "learning_rate": 1.5433629581504938e-06, "loss": 1.3347, "step": 30252 }, { "epoch": 0.83, "learning_rate": 1.542890915481282e-06, "loss": 1.1772, "step": 30253 }, { "epoch": 0.83, "learning_rate": 1.5424189389765165e-06, "loss": 1.1594, "step": 30254 }, { "epoch": 0.83, "learning_rate": 1.5419470286398842e-06, "loss": 1.2146, "step": 30255 }, { "epoch": 0.83, "learning_rate": 1.5414751844750842e-06, "loss": 1.2888, "step": 30256 }, { "epoch": 0.83, "learning_rate": 1.5410034064858048e-06, "loss": 1.3367, "step": 30257 }, { "epoch": 0.83, "learning_rate": 1.5405316946757355e-06, "loss": 1.4932, "step": 30258 }, { "epoch": 0.83, "learning_rate": 1.5400600490485696e-06, "loss": 1.2236, "step": 30259 }, { "epoch": 0.83, "learning_rate": 1.5395884696079954e-06, "loss": 1.3022, "step": 30260 }, { "epoch": 0.83, "learning_rate": 1.5391169563577036e-06, "loss": 1.4053, "step": 30261 }, { "epoch": 0.83, "learning_rate": 1.5386455093013796e-06, "loss": 1.1387, "step": 30262 }, { "epoch": 0.83, "learning_rate": 1.5381741284427165e-06, "loss": 1.0979, "step": 30263 }, { "epoch": 0.83, "learning_rate": 1.5377028137854e-06, "loss": 1.2549, "step": 30264 }, { "epoch": 0.83, "learning_rate": 1.5372315653331183e-06, "loss": 1.2368, "step": 30265 }, { "epoch": 0.83, "learning_rate": 1.5367603830895538e-06, "loss": 1.1714, "step": 30266 }, { "epoch": 0.83, "learning_rate": 1.5362892670583995e-06, "loss": 1.1702, "step": 30267 }, { "epoch": 0.83, "learning_rate": 1.5358182172433368e-06, "loss": 1.4526, "step": 30268 }, { "epoch": 0.83, "learning_rate": 1.5353472336480535e-06, "loss": 1.2542, "step": 30269 }, { "epoch": 0.83, "learning_rate": 1.5348763162762303e-06, "loss": 1.3621, "step": 30270 }, { "epoch": 0.83, "learning_rate": 1.5344054651315566e-06, "loss": 1.1836, "step": 30271 }, { "epoch": 0.83, "learning_rate": 1.5339346802177136e-06, "loss": 1.1509, "step": 30272 }, { "epoch": 0.83, "learning_rate": 1.533463961538385e-06, "loss": 1.2449, "step": 30273 }, { "epoch": 0.83, "learning_rate": 1.5329933090972503e-06, "loss": 1.2476, "step": 30274 }, { "epoch": 0.83, "learning_rate": 1.5325227228979978e-06, "loss": 1.2407, "step": 30275 }, { "epoch": 0.83, "learning_rate": 1.532052202944304e-06, "loss": 1.0829, "step": 30276 }, { "epoch": 0.83, "learning_rate": 1.531581749239851e-06, "loss": 1.3525, "step": 30277 }, { "epoch": 0.83, "learning_rate": 1.5311113617883222e-06, "loss": 1.2329, "step": 30278 }, { "epoch": 0.83, "learning_rate": 1.5306410405933957e-06, "loss": 1.1982, "step": 30279 }, { "epoch": 0.83, "learning_rate": 1.5301707856587521e-06, "loss": 1.2966, "step": 30280 }, { "epoch": 0.83, "learning_rate": 1.5297005969880662e-06, "loss": 1.4153, "step": 30281 }, { "epoch": 0.83, "learning_rate": 1.5292304745850216e-06, "loss": 1.2874, "step": 30282 }, { "epoch": 0.83, "learning_rate": 1.5287604184532934e-06, "loss": 1.2765, "step": 30283 }, { "epoch": 0.83, "learning_rate": 1.5282904285965639e-06, "loss": 1.2307, "step": 30284 }, { "epoch": 0.83, "learning_rate": 1.5278205050185023e-06, "loss": 1.3193, "step": 30285 }, { "epoch": 0.83, "learning_rate": 1.5273506477227916e-06, "loss": 1.1462, "step": 30286 }, { "epoch": 0.83, "learning_rate": 1.5268808567131022e-06, "loss": 1.7461, "step": 30287 }, { "epoch": 0.83, "learning_rate": 1.5264111319931185e-06, "loss": 1.3752, "step": 30288 }, { "epoch": 0.83, "learning_rate": 1.5259414735665035e-06, "loss": 1.3445, "step": 30289 }, { "epoch": 0.83, "learning_rate": 1.5254718814369386e-06, "loss": 1.2217, "step": 30290 }, { "epoch": 0.83, "learning_rate": 1.5250023556080985e-06, "loss": 1.1807, "step": 30291 }, { "epoch": 0.83, "learning_rate": 1.5245328960836548e-06, "loss": 1.2163, "step": 30292 }, { "epoch": 0.83, "learning_rate": 1.5240635028672812e-06, "loss": 1.2913, "step": 30293 }, { "epoch": 0.83, "learning_rate": 1.523594175962646e-06, "loss": 1.1592, "step": 30294 }, { "epoch": 0.83, "learning_rate": 1.5231249153734263e-06, "loss": 1.2866, "step": 30295 }, { "epoch": 0.83, "learning_rate": 1.522655721103291e-06, "loss": 1.3403, "step": 30296 }, { "epoch": 0.83, "learning_rate": 1.522186593155911e-06, "loss": 1.2385, "step": 30297 }, { "epoch": 0.83, "learning_rate": 1.5217175315349552e-06, "loss": 1.6963, "step": 30298 }, { "epoch": 0.83, "learning_rate": 1.5212485362440965e-06, "loss": 1.0894, "step": 30299 }, { "epoch": 0.83, "learning_rate": 1.5207796072870018e-06, "loss": 1.3071, "step": 30300 }, { "epoch": 0.83, "learning_rate": 1.5203107446673405e-06, "loss": 1.1709, "step": 30301 }, { "epoch": 0.83, "learning_rate": 1.5198419483887783e-06, "loss": 1.2861, "step": 30302 }, { "epoch": 0.83, "learning_rate": 1.519373218454987e-06, "loss": 1.2754, "step": 30303 }, { "epoch": 0.83, "learning_rate": 1.5189045548696324e-06, "loss": 1.3103, "step": 30304 }, { "epoch": 0.83, "learning_rate": 1.5184359576363772e-06, "loss": 1.0747, "step": 30305 }, { "epoch": 0.83, "learning_rate": 1.517967426758894e-06, "loss": 1.2651, "step": 30306 }, { "epoch": 0.83, "learning_rate": 1.5174989622408453e-06, "loss": 1.3081, "step": 30307 }, { "epoch": 0.83, "learning_rate": 1.517030564085895e-06, "loss": 1.2856, "step": 30308 }, { "epoch": 0.83, "learning_rate": 1.516562232297707e-06, "loss": 1.364, "step": 30309 }, { "epoch": 0.83, "learning_rate": 1.516093966879949e-06, "loss": 1.1892, "step": 30310 }, { "epoch": 0.83, "learning_rate": 1.5156257678362817e-06, "loss": 1.2097, "step": 30311 }, { "epoch": 0.83, "learning_rate": 1.5151576351703702e-06, "loss": 1.3271, "step": 30312 }, { "epoch": 0.83, "learning_rate": 1.514689568885872e-06, "loss": 1.1731, "step": 30313 }, { "epoch": 0.83, "learning_rate": 1.514221568986456e-06, "loss": 1.2605, "step": 30314 }, { "epoch": 0.83, "learning_rate": 1.5137536354757787e-06, "loss": 1.3992, "step": 30315 }, { "epoch": 0.83, "learning_rate": 1.513285768357503e-06, "loss": 1.3018, "step": 30316 }, { "epoch": 0.83, "learning_rate": 1.5128179676352872e-06, "loss": 1.3013, "step": 30317 }, { "epoch": 0.83, "learning_rate": 1.5123502333127937e-06, "loss": 1.2808, "step": 30318 }, { "epoch": 0.83, "learning_rate": 1.511882565393682e-06, "loss": 1.2771, "step": 30319 }, { "epoch": 0.83, "learning_rate": 1.5114149638816067e-06, "loss": 1.2451, "step": 30320 }, { "epoch": 0.83, "learning_rate": 1.5109474287802318e-06, "loss": 1.2009, "step": 30321 }, { "epoch": 0.83, "learning_rate": 1.5104799600932095e-06, "loss": 1.2666, "step": 30322 }, { "epoch": 0.83, "learning_rate": 1.5100125578242053e-06, "loss": 1.2073, "step": 30323 }, { "epoch": 0.83, "learning_rate": 1.5095452219768646e-06, "loss": 1.186, "step": 30324 }, { "epoch": 0.83, "learning_rate": 1.5090779525548537e-06, "loss": 1.229, "step": 30325 }, { "epoch": 0.83, "learning_rate": 1.5086107495618208e-06, "loss": 1.3474, "step": 30326 }, { "epoch": 0.83, "learning_rate": 1.5081436130014293e-06, "loss": 1.29, "step": 30327 }, { "epoch": 0.83, "learning_rate": 1.5076765428773243e-06, "loss": 1.0135, "step": 30328 }, { "epoch": 0.83, "learning_rate": 1.5072095391931673e-06, "loss": 1.2493, "step": 30329 }, { "epoch": 0.83, "learning_rate": 1.5067426019526067e-06, "loss": 1.2098, "step": 30330 }, { "epoch": 0.83, "learning_rate": 1.5062757311593024e-06, "loss": 1.3064, "step": 30331 }, { "epoch": 0.83, "learning_rate": 1.5058089268168985e-06, "loss": 1.1621, "step": 30332 }, { "epoch": 0.83, "learning_rate": 1.5053421889290543e-06, "loss": 1.3149, "step": 30333 }, { "epoch": 0.83, "learning_rate": 1.5048755174994144e-06, "loss": 1.2546, "step": 30334 }, { "epoch": 0.83, "learning_rate": 1.5044089125316397e-06, "loss": 1.4282, "step": 30335 }, { "epoch": 0.83, "learning_rate": 1.5039423740293701e-06, "loss": 1.3162, "step": 30336 }, { "epoch": 0.83, "learning_rate": 1.5034759019962596e-06, "loss": 1.312, "step": 30337 }, { "epoch": 0.83, "learning_rate": 1.5030094964359609e-06, "loss": 1.3225, "step": 30338 }, { "epoch": 0.83, "learning_rate": 1.5025431573521209e-06, "loss": 1.3049, "step": 30339 }, { "epoch": 0.83, "learning_rate": 1.5020768847483868e-06, "loss": 1.27, "step": 30340 }, { "epoch": 0.83, "learning_rate": 1.5016106786284046e-06, "loss": 1.3064, "step": 30341 }, { "epoch": 0.83, "learning_rate": 1.501144538995828e-06, "loss": 1.3149, "step": 30342 }, { "epoch": 0.83, "learning_rate": 1.5006784658542984e-06, "loss": 1.3049, "step": 30343 }, { "epoch": 0.83, "learning_rate": 1.500212459207464e-06, "loss": 1.2114, "step": 30344 }, { "epoch": 0.83, "learning_rate": 1.4997465190589688e-06, "loss": 1.3093, "step": 30345 }, { "epoch": 0.83, "learning_rate": 1.499280645412462e-06, "loss": 1.2593, "step": 30346 }, { "epoch": 0.83, "learning_rate": 1.498814838271586e-06, "loss": 1.1348, "step": 30347 }, { "epoch": 0.83, "learning_rate": 1.498349097639985e-06, "loss": 1.2812, "step": 30348 }, { "epoch": 0.83, "learning_rate": 1.4978834235213013e-06, "loss": 1.1992, "step": 30349 }, { "epoch": 0.83, "learning_rate": 1.497417815919181e-06, "loss": 1.6677, "step": 30350 }, { "epoch": 0.83, "learning_rate": 1.4969522748372655e-06, "loss": 1.4026, "step": 30351 }, { "epoch": 0.83, "learning_rate": 1.4964868002791954e-06, "loss": 1.2244, "step": 30352 }, { "epoch": 0.83, "learning_rate": 1.4960213922486167e-06, "loss": 1.2083, "step": 30353 }, { "epoch": 0.83, "learning_rate": 1.4955560507491663e-06, "loss": 1.2004, "step": 30354 }, { "epoch": 0.83, "learning_rate": 1.4950907757844867e-06, "loss": 1.1531, "step": 30355 }, { "epoch": 0.83, "learning_rate": 1.4946255673582165e-06, "loss": 1.2627, "step": 30356 }, { "epoch": 0.83, "learning_rate": 1.4941604254739972e-06, "loss": 1.2583, "step": 30357 }, { "epoch": 0.83, "learning_rate": 1.493695350135468e-06, "loss": 1.2349, "step": 30358 }, { "epoch": 0.83, "learning_rate": 1.4932303413462656e-06, "loss": 1.1328, "step": 30359 }, { "epoch": 0.83, "learning_rate": 1.4927653991100267e-06, "loss": 1.365, "step": 30360 }, { "epoch": 0.83, "learning_rate": 1.4923005234303933e-06, "loss": 1.2532, "step": 30361 }, { "epoch": 0.83, "learning_rate": 1.4918357143110007e-06, "loss": 1.23, "step": 30362 }, { "epoch": 0.83, "learning_rate": 1.4913709717554836e-06, "loss": 1.1938, "step": 30363 }, { "epoch": 0.83, "learning_rate": 1.490906295767478e-06, "loss": 1.6602, "step": 30364 }, { "epoch": 0.83, "learning_rate": 1.490441686350621e-06, "loss": 1.3699, "step": 30365 }, { "epoch": 0.83, "learning_rate": 1.4899771435085485e-06, "loss": 1.2632, "step": 30366 }, { "epoch": 0.83, "learning_rate": 1.4895126672448889e-06, "loss": 1.2837, "step": 30367 }, { "epoch": 0.83, "learning_rate": 1.4890482575632836e-06, "loss": 1.7246, "step": 30368 }, { "epoch": 0.83, "learning_rate": 1.488583914467361e-06, "loss": 1.2954, "step": 30369 }, { "epoch": 0.83, "learning_rate": 1.4881196379607587e-06, "loss": 1.2803, "step": 30370 }, { "epoch": 0.83, "learning_rate": 1.4876554280471023e-06, "loss": 1.321, "step": 30371 }, { "epoch": 0.83, "learning_rate": 1.4871912847300285e-06, "loss": 1.3342, "step": 30372 }, { "epoch": 0.83, "learning_rate": 1.4867272080131655e-06, "loss": 1.2412, "step": 30373 }, { "epoch": 0.83, "learning_rate": 1.4862631979001496e-06, "loss": 1.3787, "step": 30374 }, { "epoch": 0.83, "learning_rate": 1.485799254394603e-06, "loss": 1.1838, "step": 30375 }, { "epoch": 0.83, "learning_rate": 1.4853353775001612e-06, "loss": 1.3252, "step": 30376 }, { "epoch": 0.83, "learning_rate": 1.4848715672204495e-06, "loss": 1.2261, "step": 30377 }, { "epoch": 0.83, "learning_rate": 1.484407823559103e-06, "loss": 1.2913, "step": 30378 }, { "epoch": 0.83, "learning_rate": 1.4839441465197413e-06, "loss": 1.312, "step": 30379 }, { "epoch": 0.83, "learning_rate": 1.4834805361059979e-06, "loss": 1.3083, "step": 30380 }, { "epoch": 0.83, "learning_rate": 1.4830169923214954e-06, "loss": 1.26, "step": 30381 }, { "epoch": 0.83, "learning_rate": 1.4825535151698655e-06, "loss": 1.2776, "step": 30382 }, { "epoch": 0.83, "learning_rate": 1.482090104654732e-06, "loss": 1.3401, "step": 30383 }, { "epoch": 0.83, "learning_rate": 1.4816267607797176e-06, "loss": 1.269, "step": 30384 }, { "epoch": 0.83, "learning_rate": 1.4811634835484522e-06, "loss": 1.2656, "step": 30385 }, { "epoch": 0.83, "learning_rate": 1.4807002729645581e-06, "loss": 1.1018, "step": 30386 }, { "epoch": 0.83, "learning_rate": 1.4802371290316586e-06, "loss": 1.3767, "step": 30387 }, { "epoch": 0.83, "learning_rate": 1.4797740517533755e-06, "loss": 1.2581, "step": 30388 }, { "epoch": 0.83, "learning_rate": 1.4793110411333356e-06, "loss": 1.2307, "step": 30389 }, { "epoch": 0.83, "learning_rate": 1.4788480971751594e-06, "loss": 1.377, "step": 30390 }, { "epoch": 0.83, "learning_rate": 1.47838521988247e-06, "loss": 1.3098, "step": 30391 }, { "epoch": 0.83, "learning_rate": 1.477922409258884e-06, "loss": 1.3823, "step": 30392 }, { "epoch": 0.83, "learning_rate": 1.4774596653080286e-06, "loss": 1.1562, "step": 30393 }, { "epoch": 0.83, "learning_rate": 1.47699698803352e-06, "loss": 1.3479, "step": 30394 }, { "epoch": 0.83, "learning_rate": 1.4765343774389806e-06, "loss": 1.1702, "step": 30395 }, { "epoch": 0.83, "learning_rate": 1.4760718335280255e-06, "loss": 1.376, "step": 30396 }, { "epoch": 0.83, "learning_rate": 1.4756093563042783e-06, "loss": 1.209, "step": 30397 }, { "epoch": 0.83, "learning_rate": 1.4751469457713552e-06, "loss": 1.2422, "step": 30398 }, { "epoch": 0.83, "learning_rate": 1.4746846019328708e-06, "loss": 1.2681, "step": 30399 }, { "epoch": 0.83, "learning_rate": 1.4742223247924481e-06, "loss": 1.4124, "step": 30400 }, { "epoch": 0.83, "learning_rate": 1.4737601143537006e-06, "loss": 1.3235, "step": 30401 }, { "epoch": 0.83, "learning_rate": 1.4732979706202443e-06, "loss": 1.1775, "step": 30402 }, { "epoch": 0.83, "learning_rate": 1.4728358935956933e-06, "loss": 1.21, "step": 30403 }, { "epoch": 0.83, "learning_rate": 1.4723738832836666e-06, "loss": 1.2554, "step": 30404 }, { "epoch": 0.83, "learning_rate": 1.4719119396877768e-06, "loss": 1.1902, "step": 30405 }, { "epoch": 0.83, "learning_rate": 1.471450062811638e-06, "loss": 1.2869, "step": 30406 }, { "epoch": 0.83, "learning_rate": 1.4709882526588615e-06, "loss": 1.2998, "step": 30407 }, { "epoch": 0.83, "learning_rate": 1.4705265092330646e-06, "loss": 1.2485, "step": 30408 }, { "epoch": 0.83, "learning_rate": 1.4700648325378564e-06, "loss": 1.2222, "step": 30409 }, { "epoch": 0.83, "learning_rate": 1.4696032225768507e-06, "loss": 1.1951, "step": 30410 }, { "epoch": 0.83, "learning_rate": 1.469141679353655e-06, "loss": 1.2844, "step": 30411 }, { "epoch": 0.83, "learning_rate": 1.4686802028718861e-06, "loss": 1.1182, "step": 30412 }, { "epoch": 0.83, "learning_rate": 1.4682187931351522e-06, "loss": 1.3071, "step": 30413 }, { "epoch": 0.83, "learning_rate": 1.4677574501470593e-06, "loss": 1.2808, "step": 30414 }, { "epoch": 0.83, "learning_rate": 1.4672961739112235e-06, "loss": 1.2573, "step": 30415 }, { "epoch": 0.83, "learning_rate": 1.4668349644312464e-06, "loss": 1.2903, "step": 30416 }, { "epoch": 0.83, "learning_rate": 1.4663738217107448e-06, "loss": 1.1833, "step": 30417 }, { "epoch": 0.83, "learning_rate": 1.4659127457533174e-06, "loss": 1.3137, "step": 30418 }, { "epoch": 0.83, "learning_rate": 1.4654517365625786e-06, "loss": 1.1067, "step": 30419 }, { "epoch": 0.83, "learning_rate": 1.4649907941421294e-06, "loss": 1.2722, "step": 30420 }, { "epoch": 0.83, "learning_rate": 1.4645299184955831e-06, "loss": 1.1825, "step": 30421 }, { "epoch": 0.83, "learning_rate": 1.4640691096265358e-06, "loss": 1.3101, "step": 30422 }, { "epoch": 0.83, "learning_rate": 1.4636083675386014e-06, "loss": 1.4065, "step": 30423 }, { "epoch": 0.83, "learning_rate": 1.4631476922353782e-06, "loss": 1.2671, "step": 30424 }, { "epoch": 0.83, "learning_rate": 1.4626870837204776e-06, "loss": 1.2739, "step": 30425 }, { "epoch": 0.83, "learning_rate": 1.4622265419974946e-06, "loss": 1.0981, "step": 30426 }, { "epoch": 0.83, "learning_rate": 1.4617660670700384e-06, "loss": 1.2366, "step": 30427 }, { "epoch": 0.83, "learning_rate": 1.4613056589417074e-06, "loss": 1.2002, "step": 30428 }, { "epoch": 0.83, "learning_rate": 1.4608453176161074e-06, "loss": 1.2916, "step": 30429 }, { "epoch": 0.83, "learning_rate": 1.4603850430968392e-06, "loss": 1.2612, "step": 30430 }, { "epoch": 0.83, "learning_rate": 1.4599248353874995e-06, "loss": 1.2219, "step": 30431 }, { "epoch": 0.83, "learning_rate": 1.4594646944916956e-06, "loss": 1.3271, "step": 30432 }, { "epoch": 0.83, "learning_rate": 1.4590046204130225e-06, "loss": 1.3586, "step": 30433 }, { "epoch": 0.83, "learning_rate": 1.4585446131550818e-06, "loss": 1.0864, "step": 30434 }, { "epoch": 0.83, "learning_rate": 1.4580846727214692e-06, "loss": 1.3298, "step": 30435 }, { "epoch": 0.83, "learning_rate": 1.4576247991157876e-06, "loss": 1.1953, "step": 30436 }, { "epoch": 0.83, "learning_rate": 1.457164992341633e-06, "loss": 1.1145, "step": 30437 }, { "epoch": 0.83, "learning_rate": 1.4567052524026025e-06, "loss": 1.3596, "step": 30438 }, { "epoch": 0.83, "learning_rate": 1.45624557930229e-06, "loss": 1.1792, "step": 30439 }, { "epoch": 0.83, "learning_rate": 1.455785973044297e-06, "loss": 1.1548, "step": 30440 }, { "epoch": 0.83, "learning_rate": 1.455326433632217e-06, "loss": 1.1528, "step": 30441 }, { "epoch": 0.83, "learning_rate": 1.4548669610696443e-06, "loss": 1.2695, "step": 30442 }, { "epoch": 0.83, "learning_rate": 1.4544075553601732e-06, "loss": 1.0822, "step": 30443 }, { "epoch": 0.83, "learning_rate": 1.4539482165074004e-06, "loss": 1.4104, "step": 30444 }, { "epoch": 0.83, "learning_rate": 1.4534889445149182e-06, "loss": 1.4287, "step": 30445 }, { "epoch": 0.83, "learning_rate": 1.4530297393863168e-06, "loss": 1.4299, "step": 30446 }, { "epoch": 0.83, "learning_rate": 1.452570601125195e-06, "loss": 1.3398, "step": 30447 }, { "epoch": 0.83, "learning_rate": 1.4521115297351408e-06, "loss": 1.1953, "step": 30448 }, { "epoch": 0.83, "learning_rate": 1.4516525252197467e-06, "loss": 1.1946, "step": 30449 }, { "epoch": 0.83, "learning_rate": 1.451193587582601e-06, "loss": 1.354, "step": 30450 }, { "epoch": 0.83, "learning_rate": 1.4507347168273001e-06, "loss": 1.2354, "step": 30451 }, { "epoch": 0.83, "learning_rate": 1.4502759129574295e-06, "loss": 1.1902, "step": 30452 }, { "epoch": 0.83, "learning_rate": 1.44981717597658e-06, "loss": 1.2771, "step": 30453 }, { "epoch": 0.83, "learning_rate": 1.4493585058883387e-06, "loss": 1.2495, "step": 30454 }, { "epoch": 0.83, "learning_rate": 1.448899902696297e-06, "loss": 1.2736, "step": 30455 }, { "epoch": 0.83, "learning_rate": 1.448441366404042e-06, "loss": 1.3435, "step": 30456 }, { "epoch": 0.83, "learning_rate": 1.4479828970151598e-06, "loss": 1.2278, "step": 30457 }, { "epoch": 0.83, "learning_rate": 1.4475244945332367e-06, "loss": 1.2458, "step": 30458 }, { "epoch": 0.83, "learning_rate": 1.4470661589618617e-06, "loss": 1.1702, "step": 30459 }, { "epoch": 0.83, "learning_rate": 1.4466078903046198e-06, "loss": 1.2532, "step": 30460 }, { "epoch": 0.83, "learning_rate": 1.4461496885650938e-06, "loss": 1.1887, "step": 30461 }, { "epoch": 0.83, "learning_rate": 1.4456915537468719e-06, "loss": 1.2461, "step": 30462 }, { "epoch": 0.83, "learning_rate": 1.4452334858535343e-06, "loss": 1.2346, "step": 30463 }, { "epoch": 0.83, "learning_rate": 1.444775484888672e-06, "loss": 1.2351, "step": 30464 }, { "epoch": 0.83, "learning_rate": 1.4443175508558593e-06, "loss": 1.2676, "step": 30465 }, { "epoch": 0.83, "learning_rate": 1.443859683758685e-06, "loss": 1.2778, "step": 30466 }, { "epoch": 0.83, "learning_rate": 1.443401883600727e-06, "loss": 1.2964, "step": 30467 }, { "epoch": 0.83, "learning_rate": 1.4429441503855724e-06, "loss": 1.3008, "step": 30468 }, { "epoch": 0.83, "learning_rate": 1.442486484116795e-06, "loss": 1.2864, "step": 30469 }, { "epoch": 0.83, "learning_rate": 1.4420288847979824e-06, "loss": 1.3501, "step": 30470 }, { "epoch": 0.83, "learning_rate": 1.441571352432709e-06, "loss": 1.1814, "step": 30471 }, { "epoch": 0.83, "learning_rate": 1.4411138870245611e-06, "loss": 1.2236, "step": 30472 }, { "epoch": 0.83, "learning_rate": 1.4406564885771091e-06, "loss": 1.2222, "step": 30473 }, { "epoch": 0.83, "learning_rate": 1.4401991570939379e-06, "loss": 1.1475, "step": 30474 }, { "epoch": 0.83, "learning_rate": 1.439741892578621e-06, "loss": 1.1877, "step": 30475 }, { "epoch": 0.83, "learning_rate": 1.4392846950347417e-06, "loss": 1.4321, "step": 30476 }, { "epoch": 0.83, "learning_rate": 1.4388275644658723e-06, "loss": 1.281, "step": 30477 }, { "epoch": 0.83, "learning_rate": 1.4383705008755877e-06, "loss": 1.1436, "step": 30478 }, { "epoch": 0.83, "learning_rate": 1.4379135042674696e-06, "loss": 1.3091, "step": 30479 }, { "epoch": 0.83, "learning_rate": 1.4374565746450897e-06, "loss": 1.2683, "step": 30480 }, { "epoch": 0.83, "learning_rate": 1.4369997120120228e-06, "loss": 1.1655, "step": 30481 }, { "epoch": 0.83, "learning_rate": 1.4365429163718415e-06, "loss": 1.2686, "step": 30482 }, { "epoch": 0.83, "learning_rate": 1.436086187728124e-06, "loss": 1.2878, "step": 30483 }, { "epoch": 0.83, "learning_rate": 1.4356295260844412e-06, "loss": 1.2319, "step": 30484 }, { "epoch": 0.83, "learning_rate": 1.4351729314443651e-06, "loss": 1.2996, "step": 30485 }, { "epoch": 0.83, "learning_rate": 1.434716403811467e-06, "loss": 1.3132, "step": 30486 }, { "epoch": 0.83, "learning_rate": 1.4342599431893223e-06, "loss": 1.2397, "step": 30487 }, { "epoch": 0.83, "learning_rate": 1.4338035495814996e-06, "loss": 1.3608, "step": 30488 }, { "epoch": 0.83, "learning_rate": 1.433347222991569e-06, "loss": 1.1685, "step": 30489 }, { "epoch": 0.83, "learning_rate": 1.4328909634231004e-06, "loss": 1.2871, "step": 30490 }, { "epoch": 0.83, "learning_rate": 1.432434770879666e-06, "loss": 1.2004, "step": 30491 }, { "epoch": 0.83, "learning_rate": 1.4319786453648344e-06, "loss": 1.2695, "step": 30492 }, { "epoch": 0.83, "learning_rate": 1.431522586882169e-06, "loss": 1.3518, "step": 30493 }, { "epoch": 0.83, "learning_rate": 1.4310665954352443e-06, "loss": 1.3984, "step": 30494 }, { "epoch": 0.83, "learning_rate": 1.4306106710276257e-06, "loss": 1.1638, "step": 30495 }, { "epoch": 0.83, "learning_rate": 1.4301548136628795e-06, "loss": 1.324, "step": 30496 }, { "epoch": 0.83, "learning_rate": 1.4296990233445696e-06, "loss": 1.2708, "step": 30497 }, { "epoch": 0.83, "learning_rate": 1.4292433000762672e-06, "loss": 1.29, "step": 30498 }, { "epoch": 0.83, "learning_rate": 1.4287876438615356e-06, "loss": 1.1963, "step": 30499 }, { "epoch": 0.83, "learning_rate": 1.4283320547039381e-06, "loss": 1.2603, "step": 30500 }, { "epoch": 0.83, "learning_rate": 1.4278765326070377e-06, "loss": 1.2563, "step": 30501 }, { "epoch": 0.83, "learning_rate": 1.4274210775744025e-06, "loss": 1.2456, "step": 30502 }, { "epoch": 0.83, "learning_rate": 1.426965689609594e-06, "loss": 1.1079, "step": 30503 }, { "epoch": 0.83, "learning_rate": 1.4265103687161741e-06, "loss": 1.1411, "step": 30504 }, { "epoch": 0.83, "learning_rate": 1.4260551148977042e-06, "loss": 1.2561, "step": 30505 }, { "epoch": 0.83, "learning_rate": 1.4255999281577492e-06, "loss": 1.2676, "step": 30506 }, { "epoch": 0.83, "learning_rate": 1.4251448084998687e-06, "loss": 1.1455, "step": 30507 }, { "epoch": 0.83, "learning_rate": 1.4246897559276195e-06, "loss": 1.2544, "step": 30508 }, { "epoch": 0.83, "learning_rate": 1.4242347704445692e-06, "loss": 1.2236, "step": 30509 }, { "epoch": 0.83, "learning_rate": 1.42377985205427e-06, "loss": 1.2388, "step": 30510 }, { "epoch": 0.83, "learning_rate": 1.4233250007602873e-06, "loss": 1.4187, "step": 30511 }, { "epoch": 0.83, "learning_rate": 1.4228702165661766e-06, "loss": 1.6562, "step": 30512 }, { "epoch": 0.83, "learning_rate": 1.4224154994754956e-06, "loss": 1.3481, "step": 30513 }, { "epoch": 0.83, "learning_rate": 1.4219608494918003e-06, "loss": 1.2432, "step": 30514 }, { "epoch": 0.83, "learning_rate": 1.4215062666186518e-06, "loss": 1.2498, "step": 30515 }, { "epoch": 0.83, "learning_rate": 1.4210517508596045e-06, "loss": 1.355, "step": 30516 }, { "epoch": 0.83, "learning_rate": 1.4205973022182151e-06, "loss": 1.3572, "step": 30517 }, { "epoch": 0.83, "learning_rate": 1.4201429206980344e-06, "loss": 1.2075, "step": 30518 }, { "epoch": 0.83, "learning_rate": 1.4196886063026238e-06, "loss": 1.2239, "step": 30519 }, { "epoch": 0.83, "learning_rate": 1.419234359035535e-06, "loss": 1.2173, "step": 30520 }, { "epoch": 0.83, "learning_rate": 1.4187801789003219e-06, "loss": 1.2715, "step": 30521 }, { "epoch": 0.83, "learning_rate": 1.418326065900535e-06, "loss": 1.1758, "step": 30522 }, { "epoch": 0.83, "learning_rate": 1.417872020039731e-06, "loss": 1.2805, "step": 30523 }, { "epoch": 0.83, "learning_rate": 1.4174180413214612e-06, "loss": 1.123, "step": 30524 }, { "epoch": 0.83, "learning_rate": 1.4169641297492753e-06, "loss": 1.3953, "step": 30525 }, { "epoch": 0.83, "learning_rate": 1.4165102853267276e-06, "loss": 1.3027, "step": 30526 }, { "epoch": 0.83, "learning_rate": 1.4160565080573673e-06, "loss": 1.2969, "step": 30527 }, { "epoch": 0.83, "learning_rate": 1.415602797944744e-06, "loss": 1.3369, "step": 30528 }, { "epoch": 0.83, "learning_rate": 1.4151491549924056e-06, "loss": 1.2273, "step": 30529 }, { "epoch": 0.83, "learning_rate": 1.4146955792039064e-06, "loss": 1.3025, "step": 30530 }, { "epoch": 0.83, "learning_rate": 1.414242070582791e-06, "loss": 1.2505, "step": 30531 }, { "epoch": 0.83, "learning_rate": 1.4137886291326086e-06, "loss": 1.3282, "step": 30532 }, { "epoch": 0.83, "learning_rate": 1.4133352548569046e-06, "loss": 1.158, "step": 30533 }, { "epoch": 0.83, "learning_rate": 1.4128819477592292e-06, "loss": 1.165, "step": 30534 }, { "epoch": 0.83, "learning_rate": 1.4124287078431286e-06, "loss": 1.2659, "step": 30535 }, { "epoch": 0.83, "learning_rate": 1.4119755351121466e-06, "loss": 1.3616, "step": 30536 }, { "epoch": 0.83, "learning_rate": 1.4115224295698282e-06, "loss": 1.2917, "step": 30537 }, { "epoch": 0.83, "learning_rate": 1.4110693912197216e-06, "loss": 1.1304, "step": 30538 }, { "epoch": 0.83, "learning_rate": 1.4106164200653693e-06, "loss": 1.3, "step": 30539 }, { "epoch": 0.83, "learning_rate": 1.4101635161103134e-06, "loss": 1.3062, "step": 30540 }, { "epoch": 0.83, "learning_rate": 1.4097106793581007e-06, "loss": 1.2793, "step": 30541 }, { "epoch": 0.83, "learning_rate": 1.4092579098122717e-06, "loss": 1.1438, "step": 30542 }, { "epoch": 0.83, "learning_rate": 1.4088052074763704e-06, "loss": 1.1694, "step": 30543 }, { "epoch": 0.83, "learning_rate": 1.4083525723539338e-06, "loss": 1.1419, "step": 30544 }, { "epoch": 0.83, "learning_rate": 1.4079000044485091e-06, "loss": 1.2295, "step": 30545 }, { "epoch": 0.83, "learning_rate": 1.4074475037636325e-06, "loss": 1.3059, "step": 30546 }, { "epoch": 0.83, "learning_rate": 1.4069950703028513e-06, "loss": 1.2695, "step": 30547 }, { "epoch": 0.83, "learning_rate": 1.4065427040696944e-06, "loss": 1.229, "step": 30548 }, { "epoch": 0.83, "learning_rate": 1.4060904050677093e-06, "loss": 1.2534, "step": 30549 }, { "epoch": 0.83, "learning_rate": 1.4056381733004286e-06, "loss": 1.1191, "step": 30550 }, { "epoch": 0.83, "learning_rate": 1.4051860087713986e-06, "loss": 1.3105, "step": 30551 }, { "epoch": 0.83, "learning_rate": 1.4047339114841475e-06, "loss": 1.3113, "step": 30552 }, { "epoch": 0.83, "learning_rate": 1.4042818814422165e-06, "loss": 1.2642, "step": 30553 }, { "epoch": 0.83, "learning_rate": 1.4038299186491444e-06, "loss": 1.2795, "step": 30554 }, { "epoch": 0.83, "learning_rate": 1.4033780231084636e-06, "loss": 1.0588, "step": 30555 }, { "epoch": 0.83, "learning_rate": 1.4029261948237117e-06, "loss": 1.1504, "step": 30556 }, { "epoch": 0.83, "learning_rate": 1.402474433798421e-06, "loss": 1.1821, "step": 30557 }, { "epoch": 0.83, "learning_rate": 1.4020227400361287e-06, "loss": 1.3604, "step": 30558 }, { "epoch": 0.83, "learning_rate": 1.4015711135403676e-06, "loss": 1.2837, "step": 30559 }, { "epoch": 0.83, "learning_rate": 1.4011195543146704e-06, "loss": 1.2805, "step": 30560 }, { "epoch": 0.83, "learning_rate": 1.400668062362569e-06, "loss": 1.1792, "step": 30561 }, { "epoch": 0.83, "learning_rate": 1.4002166376875992e-06, "loss": 1.2009, "step": 30562 }, { "epoch": 0.83, "learning_rate": 1.3997652802932904e-06, "loss": 1.2539, "step": 30563 }, { "epoch": 0.83, "learning_rate": 1.3993139901831732e-06, "loss": 1.2661, "step": 30564 }, { "epoch": 0.83, "learning_rate": 1.398862767360778e-06, "loss": 1.2158, "step": 30565 }, { "epoch": 0.83, "learning_rate": 1.3984116118296375e-06, "loss": 1.2695, "step": 30566 }, { "epoch": 0.83, "learning_rate": 1.397960523593279e-06, "loss": 1.3245, "step": 30567 }, { "epoch": 0.83, "learning_rate": 1.3975095026552333e-06, "loss": 1.228, "step": 30568 }, { "epoch": 0.83, "learning_rate": 1.3970585490190259e-06, "loss": 1.2297, "step": 30569 }, { "epoch": 0.83, "learning_rate": 1.3966076626881897e-06, "loss": 1.228, "step": 30570 }, { "epoch": 0.83, "learning_rate": 1.3961568436662487e-06, "loss": 1.2617, "step": 30571 }, { "epoch": 0.83, "learning_rate": 1.3957060919567288e-06, "loss": 1.1335, "step": 30572 }, { "epoch": 0.83, "learning_rate": 1.3952554075631608e-06, "loss": 1.1934, "step": 30573 }, { "epoch": 0.83, "learning_rate": 1.3948047904890683e-06, "loss": 1.2375, "step": 30574 }, { "epoch": 0.83, "learning_rate": 1.3943542407379761e-06, "loss": 1.3643, "step": 30575 }, { "epoch": 0.84, "learning_rate": 1.3939037583134075e-06, "loss": 1.2671, "step": 30576 }, { "epoch": 0.84, "learning_rate": 1.3934533432188912e-06, "loss": 1.3276, "step": 30577 }, { "epoch": 0.84, "learning_rate": 1.3930029954579494e-06, "loss": 1.5122, "step": 30578 }, { "epoch": 0.84, "learning_rate": 1.3925527150341044e-06, "loss": 1.2749, "step": 30579 }, { "epoch": 0.84, "learning_rate": 1.3921025019508782e-06, "loss": 1.4026, "step": 30580 }, { "epoch": 0.84, "learning_rate": 1.3916523562117956e-06, "loss": 1.0837, "step": 30581 }, { "epoch": 0.84, "learning_rate": 1.391202277820377e-06, "loss": 1.3955, "step": 30582 }, { "epoch": 0.84, "learning_rate": 1.3907522667801444e-06, "loss": 1.2234, "step": 30583 }, { "epoch": 0.84, "learning_rate": 1.3903023230946143e-06, "loss": 1.0946, "step": 30584 }, { "epoch": 0.84, "learning_rate": 1.3898524467673114e-06, "loss": 1.1091, "step": 30585 }, { "epoch": 0.84, "learning_rate": 1.389402637801759e-06, "loss": 1.2852, "step": 30586 }, { "epoch": 0.84, "learning_rate": 1.3889528962014653e-06, "loss": 1.0654, "step": 30587 }, { "epoch": 0.84, "learning_rate": 1.3885032219699578e-06, "loss": 1.2659, "step": 30588 }, { "epoch": 0.84, "learning_rate": 1.3880536151107505e-06, "loss": 1.3345, "step": 30589 }, { "epoch": 0.84, "learning_rate": 1.3876040756273657e-06, "loss": 1.1064, "step": 30590 }, { "epoch": 0.84, "learning_rate": 1.387154603523312e-06, "loss": 1.3247, "step": 30591 }, { "epoch": 0.84, "learning_rate": 1.3867051988021129e-06, "loss": 1.2795, "step": 30592 }, { "epoch": 0.84, "learning_rate": 1.3862558614672806e-06, "loss": 1.0615, "step": 30593 }, { "epoch": 0.84, "learning_rate": 1.3858065915223352e-06, "loss": 1.1882, "step": 30594 }, { "epoch": 0.84, "learning_rate": 1.385357388970785e-06, "loss": 1.2705, "step": 30595 }, { "epoch": 0.84, "learning_rate": 1.3849082538161495e-06, "loss": 1.281, "step": 30596 }, { "epoch": 0.84, "learning_rate": 1.3844591860619382e-06, "loss": 1.3416, "step": 30597 }, { "epoch": 0.84, "learning_rate": 1.3840101857116716e-06, "loss": 1.229, "step": 30598 }, { "epoch": 0.84, "learning_rate": 1.3835612527688535e-06, "loss": 1.2966, "step": 30599 }, { "epoch": 0.84, "learning_rate": 1.3831123872370012e-06, "loss": 1.4414, "step": 30600 }, { "epoch": 0.84, "learning_rate": 1.3826635891196261e-06, "loss": 1.2849, "step": 30601 }, { "epoch": 0.84, "learning_rate": 1.38221485842024e-06, "loss": 1.3628, "step": 30602 }, { "epoch": 0.84, "learning_rate": 1.3817661951423523e-06, "loss": 1.1567, "step": 30603 }, { "epoch": 0.84, "learning_rate": 1.3813175992894712e-06, "loss": 1.1995, "step": 30604 }, { "epoch": 0.84, "learning_rate": 1.3808690708651108e-06, "loss": 1.4578, "step": 30605 }, { "epoch": 0.84, "learning_rate": 1.380420609872778e-06, "loss": 1.2834, "step": 30606 }, { "epoch": 0.84, "learning_rate": 1.37997221631598e-06, "loss": 1.2678, "step": 30607 }, { "epoch": 0.84, "learning_rate": 1.3795238901982245e-06, "loss": 1.2654, "step": 30608 }, { "epoch": 0.84, "learning_rate": 1.3790756315230226e-06, "loss": 1.2563, "step": 30609 }, { "epoch": 0.84, "learning_rate": 1.3786274402938794e-06, "loss": 1.1814, "step": 30610 }, { "epoch": 0.84, "learning_rate": 1.378179316514301e-06, "loss": 1.2539, "step": 30611 }, { "epoch": 0.84, "learning_rate": 1.3777312601877902e-06, "loss": 1.3757, "step": 30612 }, { "epoch": 0.84, "learning_rate": 1.3772832713178586e-06, "loss": 1.2134, "step": 30613 }, { "epoch": 0.84, "learning_rate": 1.3768353499080078e-06, "loss": 1.3423, "step": 30614 }, { "epoch": 0.84, "learning_rate": 1.3763874959617406e-06, "loss": 1.6621, "step": 30615 }, { "epoch": 0.84, "learning_rate": 1.3759397094825644e-06, "loss": 1.3545, "step": 30616 }, { "epoch": 0.84, "learning_rate": 1.3754919904739805e-06, "loss": 1.2693, "step": 30617 }, { "epoch": 0.84, "learning_rate": 1.3750443389394918e-06, "loss": 1.177, "step": 30618 }, { "epoch": 0.84, "learning_rate": 1.3745967548825978e-06, "loss": 1.137, "step": 30619 }, { "epoch": 0.84, "learning_rate": 1.3741492383068055e-06, "loss": 1.2661, "step": 30620 }, { "epoch": 0.84, "learning_rate": 1.3737017892156134e-06, "loss": 1.2239, "step": 30621 }, { "epoch": 0.84, "learning_rate": 1.373254407612522e-06, "loss": 1.2842, "step": 30622 }, { "epoch": 0.84, "learning_rate": 1.3728070935010295e-06, "loss": 1.1823, "step": 30623 }, { "epoch": 0.84, "learning_rate": 1.37235984688464e-06, "loss": 1.1958, "step": 30624 }, { "epoch": 0.84, "learning_rate": 1.3719126677668493e-06, "loss": 1.334, "step": 30625 }, { "epoch": 0.84, "learning_rate": 1.371465556151157e-06, "loss": 1.2449, "step": 30626 }, { "epoch": 0.84, "learning_rate": 1.371018512041058e-06, "loss": 1.0923, "step": 30627 }, { "epoch": 0.84, "learning_rate": 1.370571535440056e-06, "loss": 1.2056, "step": 30628 }, { "epoch": 0.84, "learning_rate": 1.3701246263516432e-06, "loss": 1.1765, "step": 30629 }, { "epoch": 0.84, "learning_rate": 1.3696777847793185e-06, "loss": 1.0754, "step": 30630 }, { "epoch": 0.84, "learning_rate": 1.3692310107265738e-06, "loss": 1.2351, "step": 30631 }, { "epoch": 0.84, "learning_rate": 1.3687843041969063e-06, "loss": 1.4597, "step": 30632 }, { "epoch": 0.84, "learning_rate": 1.3683376651938175e-06, "loss": 1.2778, "step": 30633 }, { "epoch": 0.84, "learning_rate": 1.3678910937207912e-06, "loss": 1.2129, "step": 30634 }, { "epoch": 0.84, "learning_rate": 1.367444589781327e-06, "loss": 1.3535, "step": 30635 }, { "epoch": 0.84, "learning_rate": 1.3669981533789157e-06, "loss": 1.2336, "step": 30636 }, { "epoch": 0.84, "learning_rate": 1.3665517845170562e-06, "loss": 1.2825, "step": 30637 }, { "epoch": 0.84, "learning_rate": 1.3661054831992304e-06, "loss": 1.2783, "step": 30638 }, { "epoch": 0.84, "learning_rate": 1.365659249428939e-06, "loss": 1.3232, "step": 30639 }, { "epoch": 0.84, "learning_rate": 1.3652130832096654e-06, "loss": 1.3154, "step": 30640 }, { "epoch": 0.84, "learning_rate": 1.3647669845449096e-06, "loss": 1.3193, "step": 30641 }, { "epoch": 0.84, "learning_rate": 1.3643209534381518e-06, "loss": 1.2458, "step": 30642 }, { "epoch": 0.84, "learning_rate": 1.3638749898928894e-06, "loss": 1.3123, "step": 30643 }, { "epoch": 0.84, "learning_rate": 1.3634290939126038e-06, "loss": 1.3176, "step": 30644 }, { "epoch": 0.84, "learning_rate": 1.3629832655007935e-06, "loss": 1.123, "step": 30645 }, { "epoch": 0.84, "learning_rate": 1.3625375046609368e-06, "loss": 1.4141, "step": 30646 }, { "epoch": 0.84, "learning_rate": 1.3620918113965242e-06, "loss": 1.2261, "step": 30647 }, { "epoch": 0.84, "learning_rate": 1.3616461857110451e-06, "loss": 1.3545, "step": 30648 }, { "epoch": 0.84, "learning_rate": 1.3612006276079848e-06, "loss": 1.3818, "step": 30649 }, { "epoch": 0.84, "learning_rate": 1.360755137090829e-06, "loss": 1.395, "step": 30650 }, { "epoch": 0.84, "learning_rate": 1.3603097141630606e-06, "loss": 1.2302, "step": 30651 }, { "epoch": 0.84, "learning_rate": 1.3598643588281668e-06, "loss": 1.313, "step": 30652 }, { "epoch": 0.84, "learning_rate": 1.3594190710896327e-06, "loss": 1.2744, "step": 30653 }, { "epoch": 0.84, "learning_rate": 1.3589738509509408e-06, "loss": 1.3101, "step": 30654 }, { "epoch": 0.84, "learning_rate": 1.358528698415572e-06, "loss": 1.176, "step": 30655 }, { "epoch": 0.84, "learning_rate": 1.3580836134870123e-06, "loss": 1.2925, "step": 30656 }, { "epoch": 0.84, "learning_rate": 1.3576385961687433e-06, "loss": 1.1987, "step": 30657 }, { "epoch": 0.84, "learning_rate": 1.3571936464642466e-06, "loss": 1.3892, "step": 30658 }, { "epoch": 0.84, "learning_rate": 1.3567487643770005e-06, "loss": 1.2161, "step": 30659 }, { "epoch": 0.84, "learning_rate": 1.3563039499104891e-06, "loss": 1.3313, "step": 30660 }, { "epoch": 0.84, "learning_rate": 1.3558592030681916e-06, "loss": 1.2849, "step": 30661 }, { "epoch": 0.84, "learning_rate": 1.3554145238535844e-06, "loss": 1.179, "step": 30662 }, { "epoch": 0.84, "learning_rate": 1.354969912270151e-06, "loss": 1.281, "step": 30663 }, { "epoch": 0.84, "learning_rate": 1.3545253683213677e-06, "loss": 1.3098, "step": 30664 }, { "epoch": 0.84, "learning_rate": 1.3540808920107129e-06, "loss": 1.2886, "step": 30665 }, { "epoch": 0.84, "learning_rate": 1.3536364833416615e-06, "loss": 1.1782, "step": 30666 }, { "epoch": 0.84, "learning_rate": 1.3531921423176953e-06, "loss": 1.2441, "step": 30667 }, { "epoch": 0.84, "learning_rate": 1.3527478689422869e-06, "loss": 1.1565, "step": 30668 }, { "epoch": 0.84, "learning_rate": 1.3523036632189136e-06, "loss": 1.2317, "step": 30669 }, { "epoch": 0.84, "learning_rate": 1.3518595251510469e-06, "loss": 1.3276, "step": 30670 }, { "epoch": 0.84, "learning_rate": 1.3514154547421665e-06, "loss": 1.3218, "step": 30671 }, { "epoch": 0.84, "learning_rate": 1.3509714519957463e-06, "loss": 1.3779, "step": 30672 }, { "epoch": 0.84, "learning_rate": 1.3505275169152575e-06, "loss": 1.3335, "step": 30673 }, { "epoch": 0.84, "learning_rate": 1.3500836495041715e-06, "loss": 1.2581, "step": 30674 }, { "epoch": 0.84, "learning_rate": 1.3496398497659668e-06, "loss": 1.2671, "step": 30675 }, { "epoch": 0.84, "learning_rate": 1.3491961177041113e-06, "loss": 1.2537, "step": 30676 }, { "epoch": 0.84, "learning_rate": 1.3487524533220763e-06, "loss": 1.1471, "step": 30677 }, { "epoch": 0.84, "learning_rate": 1.348308856623335e-06, "loss": 1.1812, "step": 30678 }, { "epoch": 0.84, "learning_rate": 1.347865327611355e-06, "loss": 1.1929, "step": 30679 }, { "epoch": 0.84, "learning_rate": 1.3474218662896132e-06, "loss": 1.3645, "step": 30680 }, { "epoch": 0.84, "learning_rate": 1.3469784726615698e-06, "loss": 1.2344, "step": 30681 }, { "epoch": 0.84, "learning_rate": 1.3465351467306986e-06, "loss": 1.2444, "step": 30682 }, { "epoch": 0.84, "learning_rate": 1.346091888500466e-06, "loss": 1.01, "step": 30683 }, { "epoch": 0.84, "learning_rate": 1.3456486979743454e-06, "loss": 1.2546, "step": 30684 }, { "epoch": 0.84, "learning_rate": 1.3452055751557957e-06, "loss": 1.3181, "step": 30685 }, { "epoch": 0.84, "learning_rate": 1.3447625200482906e-06, "loss": 1.2363, "step": 30686 }, { "epoch": 0.84, "learning_rate": 1.3443195326552904e-06, "loss": 1.2358, "step": 30687 }, { "epoch": 0.84, "learning_rate": 1.3438766129802683e-06, "loss": 1.2341, "step": 30688 }, { "epoch": 0.84, "learning_rate": 1.3434337610266812e-06, "loss": 1.1218, "step": 30689 }, { "epoch": 0.84, "learning_rate": 1.3429909767979999e-06, "loss": 1.2859, "step": 30690 }, { "epoch": 0.84, "learning_rate": 1.3425482602976836e-06, "loss": 1.3643, "step": 30691 }, { "epoch": 0.84, "learning_rate": 1.3421056115292041e-06, "loss": 1.2424, "step": 30692 }, { "epoch": 0.84, "learning_rate": 1.3416630304960144e-06, "loss": 1.3831, "step": 30693 }, { "epoch": 0.84, "learning_rate": 1.3412205172015813e-06, "loss": 1.3621, "step": 30694 }, { "epoch": 0.84, "learning_rate": 1.340778071649369e-06, "loss": 1.3101, "step": 30695 }, { "epoch": 0.84, "learning_rate": 1.3403356938428381e-06, "loss": 1.2827, "step": 30696 }, { "epoch": 0.84, "learning_rate": 1.3398933837854489e-06, "loss": 1.282, "step": 30697 }, { "epoch": 0.84, "learning_rate": 1.3394511414806587e-06, "loss": 1.2419, "step": 30698 }, { "epoch": 0.84, "learning_rate": 1.3390089669319329e-06, "loss": 1.3345, "step": 30699 }, { "epoch": 0.84, "learning_rate": 1.3385668601427283e-06, "loss": 1.2383, "step": 30700 }, { "epoch": 0.84, "learning_rate": 1.3381248211165031e-06, "loss": 1.2283, "step": 30701 }, { "epoch": 0.84, "learning_rate": 1.337682849856714e-06, "loss": 1.4009, "step": 30702 }, { "epoch": 0.84, "learning_rate": 1.3372409463668235e-06, "loss": 1.2458, "step": 30703 }, { "epoch": 0.84, "learning_rate": 1.3367991106502865e-06, "loss": 1.1882, "step": 30704 }, { "epoch": 0.84, "learning_rate": 1.336357342710559e-06, "loss": 1.1899, "step": 30705 }, { "epoch": 0.84, "learning_rate": 1.3359156425510966e-06, "loss": 1.2449, "step": 30706 }, { "epoch": 0.84, "learning_rate": 1.3354740101753571e-06, "loss": 1.1799, "step": 30707 }, { "epoch": 0.84, "learning_rate": 1.3350324455867948e-06, "loss": 1.2996, "step": 30708 }, { "epoch": 0.84, "learning_rate": 1.334590948788862e-06, "loss": 1.3901, "step": 30709 }, { "epoch": 0.84, "learning_rate": 1.3341495197850175e-06, "loss": 1.1155, "step": 30710 }, { "epoch": 0.84, "learning_rate": 1.3337081585787115e-06, "loss": 1.2649, "step": 30711 }, { "epoch": 0.84, "learning_rate": 1.3332668651733982e-06, "loss": 1.3359, "step": 30712 }, { "epoch": 0.84, "learning_rate": 1.3328256395725281e-06, "loss": 1.2822, "step": 30713 }, { "epoch": 0.84, "learning_rate": 1.332384481779555e-06, "loss": 1.1411, "step": 30714 }, { "epoch": 0.84, "learning_rate": 1.3319433917979318e-06, "loss": 1.3435, "step": 30715 }, { "epoch": 0.84, "learning_rate": 1.3315023696311057e-06, "loss": 1.7095, "step": 30716 }, { "epoch": 0.84, "learning_rate": 1.3310614152825274e-06, "loss": 1.146, "step": 30717 }, { "epoch": 0.84, "learning_rate": 1.3306205287556505e-06, "loss": 1.209, "step": 30718 }, { "epoch": 0.84, "learning_rate": 1.3301797100539226e-06, "loss": 1.1128, "step": 30719 }, { "epoch": 0.84, "learning_rate": 1.3297389591807908e-06, "loss": 1.2046, "step": 30720 }, { "epoch": 0.84, "learning_rate": 1.3292982761397022e-06, "loss": 1.2847, "step": 30721 }, { "epoch": 0.84, "learning_rate": 1.3288576609341097e-06, "loss": 1.689, "step": 30722 }, { "epoch": 0.84, "learning_rate": 1.3284171135674562e-06, "loss": 1.2441, "step": 30723 }, { "epoch": 0.84, "learning_rate": 1.3279766340431887e-06, "loss": 1.1833, "step": 30724 }, { "epoch": 0.84, "learning_rate": 1.3275362223647558e-06, "loss": 1.2346, "step": 30725 }, { "epoch": 0.84, "learning_rate": 1.327095878535598e-06, "loss": 1.3157, "step": 30726 }, { "epoch": 0.84, "learning_rate": 1.3266556025591693e-06, "loss": 1.1262, "step": 30727 }, { "epoch": 0.84, "learning_rate": 1.3262153944389044e-06, "loss": 1.167, "step": 30728 }, { "epoch": 0.84, "learning_rate": 1.325775254178253e-06, "loss": 1.1824, "step": 30729 }, { "epoch": 0.84, "learning_rate": 1.325335181780656e-06, "loss": 1.2275, "step": 30730 }, { "epoch": 0.84, "learning_rate": 1.324895177249561e-06, "loss": 1.3955, "step": 30731 }, { "epoch": 0.84, "learning_rate": 1.3244552405884025e-06, "loss": 1.1335, "step": 30732 }, { "epoch": 0.84, "learning_rate": 1.3240153718006298e-06, "loss": 1.3247, "step": 30733 }, { "epoch": 0.84, "learning_rate": 1.3235755708896781e-06, "loss": 1.3535, "step": 30734 }, { "epoch": 0.84, "learning_rate": 1.3231358378589953e-06, "loss": 1.3699, "step": 30735 }, { "epoch": 0.84, "learning_rate": 1.3226961727120135e-06, "loss": 1.2144, "step": 30736 }, { "epoch": 0.84, "learning_rate": 1.3222565754521787e-06, "loss": 1.2559, "step": 30737 }, { "epoch": 0.84, "learning_rate": 1.321817046082926e-06, "loss": 1.2368, "step": 30738 }, { "epoch": 0.84, "learning_rate": 1.321377584607697e-06, "loss": 1.177, "step": 30739 }, { "epoch": 0.84, "learning_rate": 1.3209381910299302e-06, "loss": 1.3125, "step": 30740 }, { "epoch": 0.84, "learning_rate": 1.3204988653530593e-06, "loss": 1.1577, "step": 30741 }, { "epoch": 0.84, "learning_rate": 1.320059607580525e-06, "loss": 1.1997, "step": 30742 }, { "epoch": 0.84, "learning_rate": 1.3196204177157635e-06, "loss": 1.7612, "step": 30743 }, { "epoch": 0.84, "learning_rate": 1.3191812957622107e-06, "loss": 1.325, "step": 30744 }, { "epoch": 0.84, "learning_rate": 1.3187422417232986e-06, "loss": 1.4138, "step": 30745 }, { "epoch": 0.84, "learning_rate": 1.3183032556024666e-06, "loss": 1.2578, "step": 30746 }, { "epoch": 0.84, "learning_rate": 1.3178643374031485e-06, "loss": 1.2827, "step": 30747 }, { "epoch": 0.84, "learning_rate": 1.3174254871287773e-06, "loss": 1.2827, "step": 30748 }, { "epoch": 0.84, "learning_rate": 1.3169867047827833e-06, "loss": 1.3174, "step": 30749 }, { "epoch": 0.84, "learning_rate": 1.316547990368604e-06, "loss": 1.27, "step": 30750 }, { "epoch": 0.84, "learning_rate": 1.316109343889671e-06, "loss": 1.3123, "step": 30751 }, { "epoch": 0.84, "learning_rate": 1.315670765349415e-06, "loss": 1.2266, "step": 30752 }, { "epoch": 0.84, "learning_rate": 1.3152322547512653e-06, "loss": 1.1941, "step": 30753 }, { "epoch": 0.84, "learning_rate": 1.314793812098656e-06, "loss": 1.3848, "step": 30754 }, { "epoch": 0.84, "learning_rate": 1.3143554373950162e-06, "loss": 1.335, "step": 30755 }, { "epoch": 0.84, "learning_rate": 1.3139171306437725e-06, "loss": 1.3345, "step": 30756 }, { "epoch": 0.84, "learning_rate": 1.3134788918483598e-06, "loss": 1.3093, "step": 30757 }, { "epoch": 0.84, "learning_rate": 1.3130407210122032e-06, "loss": 1.3162, "step": 30758 }, { "epoch": 0.84, "learning_rate": 1.3126026181387308e-06, "loss": 1.3469, "step": 30759 }, { "epoch": 0.84, "learning_rate": 1.3121645832313678e-06, "loss": 1.4617, "step": 30760 }, { "epoch": 0.84, "learning_rate": 1.3117266162935472e-06, "loss": 1.6479, "step": 30761 }, { "epoch": 0.84, "learning_rate": 1.3112887173286914e-06, "loss": 1.1909, "step": 30762 }, { "epoch": 0.84, "learning_rate": 1.310850886340227e-06, "loss": 1.2058, "step": 30763 }, { "epoch": 0.84, "learning_rate": 1.3104131233315777e-06, "loss": 1.2244, "step": 30764 }, { "epoch": 0.84, "learning_rate": 1.3099754283061706e-06, "loss": 1.2372, "step": 30765 }, { "epoch": 0.84, "learning_rate": 1.3095378012674309e-06, "loss": 1.4392, "step": 30766 }, { "epoch": 0.84, "learning_rate": 1.3091002422187805e-06, "loss": 1.2476, "step": 30767 }, { "epoch": 0.84, "learning_rate": 1.3086627511636408e-06, "loss": 1.2861, "step": 30768 }, { "epoch": 0.84, "learning_rate": 1.308225328105439e-06, "loss": 1.3784, "step": 30769 }, { "epoch": 0.84, "learning_rate": 1.307787973047595e-06, "loss": 1.4329, "step": 30770 }, { "epoch": 0.84, "learning_rate": 1.307350685993528e-06, "loss": 1.2676, "step": 30771 }, { "epoch": 0.84, "learning_rate": 1.3069134669466644e-06, "loss": 1.2996, "step": 30772 }, { "epoch": 0.84, "learning_rate": 1.3064763159104199e-06, "loss": 1.1611, "step": 30773 }, { "epoch": 0.84, "learning_rate": 1.306039232888221e-06, "loss": 1.321, "step": 30774 }, { "epoch": 0.84, "learning_rate": 1.3056022178834782e-06, "loss": 1.1675, "step": 30775 }, { "epoch": 0.84, "learning_rate": 1.3051652708996176e-06, "loss": 1.2126, "step": 30776 }, { "epoch": 0.84, "learning_rate": 1.3047283919400532e-06, "loss": 1.5684, "step": 30777 }, { "epoch": 0.84, "learning_rate": 1.304291581008208e-06, "loss": 1.3086, "step": 30778 }, { "epoch": 0.84, "learning_rate": 1.3038548381074957e-06, "loss": 1.2026, "step": 30779 }, { "epoch": 0.84, "learning_rate": 1.3034181632413335e-06, "loss": 1.3264, "step": 30780 }, { "epoch": 0.84, "learning_rate": 1.3029815564131366e-06, "loss": 1.0635, "step": 30781 }, { "epoch": 0.84, "learning_rate": 1.3025450176263243e-06, "loss": 1.2739, "step": 30782 }, { "epoch": 0.84, "learning_rate": 1.302108546884311e-06, "loss": 1.1594, "step": 30783 }, { "epoch": 0.84, "learning_rate": 1.3016721441905089e-06, "loss": 1.7168, "step": 30784 }, { "epoch": 0.84, "learning_rate": 1.3012358095483324e-06, "loss": 1.3052, "step": 30785 }, { "epoch": 0.84, "learning_rate": 1.3007995429611975e-06, "loss": 1.1218, "step": 30786 }, { "epoch": 0.84, "learning_rate": 1.3003633444325182e-06, "loss": 1.345, "step": 30787 }, { "epoch": 0.84, "learning_rate": 1.2999272139657016e-06, "loss": 1.1565, "step": 30788 }, { "epoch": 0.84, "learning_rate": 1.299491151564166e-06, "loss": 1.4553, "step": 30789 }, { "epoch": 0.84, "learning_rate": 1.2990551572313203e-06, "loss": 1.249, "step": 30790 }, { "epoch": 0.84, "learning_rate": 1.298619230970576e-06, "loss": 1.282, "step": 30791 }, { "epoch": 0.84, "learning_rate": 1.298183372785341e-06, "loss": 1.2627, "step": 30792 }, { "epoch": 0.84, "learning_rate": 1.2977475826790287e-06, "loss": 1.0671, "step": 30793 }, { "epoch": 0.84, "learning_rate": 1.2973118606550484e-06, "loss": 1.2605, "step": 30794 }, { "epoch": 0.84, "learning_rate": 1.2968762067168062e-06, "loss": 1.3101, "step": 30795 }, { "epoch": 0.84, "learning_rate": 1.2964406208677115e-06, "loss": 1.1782, "step": 30796 }, { "epoch": 0.84, "learning_rate": 1.2960051031111743e-06, "loss": 1.3569, "step": 30797 }, { "epoch": 0.84, "learning_rate": 1.2955696534506002e-06, "loss": 1.3145, "step": 30798 }, { "epoch": 0.84, "learning_rate": 1.2951342718893956e-06, "loss": 1.2988, "step": 30799 }, { "epoch": 0.84, "learning_rate": 1.2946989584309654e-06, "loss": 1.3701, "step": 30800 }, { "epoch": 0.84, "learning_rate": 1.2942637130787194e-06, "loss": 1.1071, "step": 30801 }, { "epoch": 0.84, "learning_rate": 1.2938285358360603e-06, "loss": 1.2793, "step": 30802 }, { "epoch": 0.84, "learning_rate": 1.2933934267063908e-06, "loss": 1.4026, "step": 30803 }, { "epoch": 0.84, "learning_rate": 1.2929583856931182e-06, "loss": 1.3381, "step": 30804 }, { "epoch": 0.84, "learning_rate": 1.2925234127996456e-06, "loss": 1.1555, "step": 30805 }, { "epoch": 0.84, "learning_rate": 1.2920885080293754e-06, "loss": 1.3801, "step": 30806 }, { "epoch": 0.84, "learning_rate": 1.2916536713857075e-06, "loss": 1.3384, "step": 30807 }, { "epoch": 0.84, "learning_rate": 1.291218902872049e-06, "loss": 1.2869, "step": 30808 }, { "epoch": 0.84, "learning_rate": 1.290784202491796e-06, "loss": 1.272, "step": 30809 }, { "epoch": 0.84, "learning_rate": 1.290349570248356e-06, "loss": 1.2908, "step": 30810 }, { "epoch": 0.84, "learning_rate": 1.2899150061451215e-06, "loss": 1.2446, "step": 30811 }, { "epoch": 0.84, "learning_rate": 1.289480510185499e-06, "loss": 1.2197, "step": 30812 }, { "epoch": 0.84, "learning_rate": 1.2890460823728823e-06, "loss": 1.1426, "step": 30813 }, { "epoch": 0.84, "learning_rate": 1.2886117227106765e-06, "loss": 1.3784, "step": 30814 }, { "epoch": 0.84, "learning_rate": 1.2881774312022731e-06, "loss": 1.3267, "step": 30815 }, { "epoch": 0.84, "learning_rate": 1.2877432078510742e-06, "loss": 1.2412, "step": 30816 }, { "epoch": 0.84, "learning_rate": 1.2873090526604737e-06, "loss": 1.1941, "step": 30817 }, { "epoch": 0.84, "learning_rate": 1.2868749656338719e-06, "loss": 1.1543, "step": 30818 }, { "epoch": 0.84, "learning_rate": 1.2864409467746641e-06, "loss": 1.3135, "step": 30819 }, { "epoch": 0.84, "learning_rate": 1.286006996086242e-06, "loss": 1.3655, "step": 30820 }, { "epoch": 0.84, "learning_rate": 1.2855731135720062e-06, "loss": 1.2971, "step": 30821 }, { "epoch": 0.84, "learning_rate": 1.2851392992353485e-06, "loss": 1.2568, "step": 30822 }, { "epoch": 0.84, "learning_rate": 1.2847055530796627e-06, "loss": 1.1494, "step": 30823 }, { "epoch": 0.84, "learning_rate": 1.2842718751083405e-06, "loss": 1.1392, "step": 30824 }, { "epoch": 0.84, "learning_rate": 1.2838382653247794e-06, "loss": 1.1907, "step": 30825 }, { "epoch": 0.84, "learning_rate": 1.2834047237323677e-06, "loss": 1.1382, "step": 30826 }, { "epoch": 0.84, "learning_rate": 1.2829712503344994e-06, "loss": 1.1953, "step": 30827 }, { "epoch": 0.84, "learning_rate": 1.2825378451345628e-06, "loss": 1.3052, "step": 30828 }, { "epoch": 0.84, "learning_rate": 1.2821045081359528e-06, "loss": 1.2227, "step": 30829 }, { "epoch": 0.84, "learning_rate": 1.2816712393420583e-06, "loss": 1.2881, "step": 30830 }, { "epoch": 0.84, "learning_rate": 1.2812380387562683e-06, "loss": 1.3354, "step": 30831 }, { "epoch": 0.84, "learning_rate": 1.2808049063819694e-06, "loss": 1.3328, "step": 30832 }, { "epoch": 0.84, "learning_rate": 1.2803718422225553e-06, "loss": 1.208, "step": 30833 }, { "epoch": 0.84, "learning_rate": 1.2799388462814111e-06, "loss": 1.3201, "step": 30834 }, { "epoch": 0.84, "learning_rate": 1.279505918561923e-06, "loss": 1.2229, "step": 30835 }, { "epoch": 0.84, "learning_rate": 1.2790730590674826e-06, "loss": 1.1663, "step": 30836 }, { "epoch": 0.84, "learning_rate": 1.2786402678014731e-06, "loss": 1.1655, "step": 30837 }, { "epoch": 0.84, "learning_rate": 1.2782075447672816e-06, "loss": 1.688, "step": 30838 }, { "epoch": 0.84, "learning_rate": 1.2777748899682907e-06, "loss": 1.3425, "step": 30839 }, { "epoch": 0.84, "learning_rate": 1.2773423034078903e-06, "loss": 1.3796, "step": 30840 }, { "epoch": 0.84, "learning_rate": 1.2769097850894607e-06, "loss": 1.0029, "step": 30841 }, { "epoch": 0.84, "learning_rate": 1.2764773350163884e-06, "loss": 1.2151, "step": 30842 }, { "epoch": 0.84, "learning_rate": 1.2760449531920516e-06, "loss": 1.2075, "step": 30843 }, { "epoch": 0.84, "learning_rate": 1.2756126396198398e-06, "loss": 1.2146, "step": 30844 }, { "epoch": 0.84, "learning_rate": 1.2751803943031327e-06, "loss": 1.4011, "step": 30845 }, { "epoch": 0.84, "learning_rate": 1.2747482172453106e-06, "loss": 1.1543, "step": 30846 }, { "epoch": 0.84, "learning_rate": 1.2743161084497546e-06, "loss": 1.229, "step": 30847 }, { "epoch": 0.84, "learning_rate": 1.273884067919845e-06, "loss": 1.4243, "step": 30848 }, { "epoch": 0.84, "learning_rate": 1.273452095658968e-06, "loss": 1.1108, "step": 30849 }, { "epoch": 0.84, "learning_rate": 1.2730201916704943e-06, "loss": 1.2947, "step": 30850 }, { "epoch": 0.84, "learning_rate": 1.2725883559578089e-06, "loss": 1.1259, "step": 30851 }, { "epoch": 0.84, "learning_rate": 1.272156588524286e-06, "loss": 1.292, "step": 30852 }, { "epoch": 0.84, "learning_rate": 1.2717248893733103e-06, "loss": 1.6758, "step": 30853 }, { "epoch": 0.84, "learning_rate": 1.2712932585082493e-06, "loss": 1.3376, "step": 30854 }, { "epoch": 0.84, "learning_rate": 1.2708616959324893e-06, "loss": 1.2229, "step": 30855 }, { "epoch": 0.84, "learning_rate": 1.2704302016493985e-06, "loss": 1.2019, "step": 30856 }, { "epoch": 0.84, "learning_rate": 1.2699987756623633e-06, "loss": 1.1616, "step": 30857 }, { "epoch": 0.84, "learning_rate": 1.2695674179747464e-06, "loss": 1.2388, "step": 30858 }, { "epoch": 0.84, "learning_rate": 1.2691361285899318e-06, "loss": 1.2222, "step": 30859 }, { "epoch": 0.84, "learning_rate": 1.268704907511289e-06, "loss": 1.2656, "step": 30860 }, { "epoch": 0.84, "learning_rate": 1.2682737547421964e-06, "loss": 1.1853, "step": 30861 }, { "epoch": 0.84, "learning_rate": 1.2678426702860203e-06, "loss": 1.2419, "step": 30862 }, { "epoch": 0.84, "learning_rate": 1.2674116541461368e-06, "loss": 1.2825, "step": 30863 }, { "epoch": 0.84, "learning_rate": 1.2669807063259199e-06, "loss": 1.1904, "step": 30864 }, { "epoch": 0.84, "learning_rate": 1.2665498268287402e-06, "loss": 1.2324, "step": 30865 }, { "epoch": 0.84, "learning_rate": 1.2661190156579672e-06, "loss": 1.1709, "step": 30866 }, { "epoch": 0.84, "learning_rate": 1.2656882728169705e-06, "loss": 1.1528, "step": 30867 }, { "epoch": 0.84, "learning_rate": 1.2652575983091242e-06, "loss": 1.3816, "step": 30868 }, { "epoch": 0.84, "learning_rate": 1.2648269921377943e-06, "loss": 1.3547, "step": 30869 }, { "epoch": 0.84, "learning_rate": 1.2643964543063502e-06, "loss": 1.2026, "step": 30870 }, { "epoch": 0.84, "learning_rate": 1.2639659848181584e-06, "loss": 1.2759, "step": 30871 }, { "epoch": 0.84, "learning_rate": 1.2635355836765918e-06, "loss": 1.1689, "step": 30872 }, { "epoch": 0.84, "learning_rate": 1.263105250885014e-06, "loss": 1.3088, "step": 30873 }, { "epoch": 0.84, "learning_rate": 1.2626749864467924e-06, "loss": 1.3477, "step": 30874 }, { "epoch": 0.84, "learning_rate": 1.2622447903652902e-06, "loss": 1.2622, "step": 30875 }, { "epoch": 0.84, "learning_rate": 1.2618146626438788e-06, "loss": 1.2839, "step": 30876 }, { "epoch": 0.84, "learning_rate": 1.2613846032859211e-06, "loss": 1.2605, "step": 30877 }, { "epoch": 0.84, "learning_rate": 1.2609546122947801e-06, "loss": 1.0923, "step": 30878 }, { "epoch": 0.84, "learning_rate": 1.26052468967382e-06, "loss": 1.5132, "step": 30879 }, { "epoch": 0.84, "learning_rate": 1.2600948354264053e-06, "loss": 1.2017, "step": 30880 }, { "epoch": 0.84, "learning_rate": 1.2596650495559005e-06, "loss": 1.2246, "step": 30881 }, { "epoch": 0.84, "learning_rate": 1.2592353320656637e-06, "loss": 1.4385, "step": 30882 }, { "epoch": 0.84, "learning_rate": 1.258805682959061e-06, "loss": 1.1704, "step": 30883 }, { "epoch": 0.84, "learning_rate": 1.2583761022394537e-06, "loss": 1.3179, "step": 30884 }, { "epoch": 0.84, "learning_rate": 1.2579465899101996e-06, "loss": 1.2891, "step": 30885 }, { "epoch": 0.84, "learning_rate": 1.2575171459746593e-06, "loss": 1.1025, "step": 30886 }, { "epoch": 0.84, "learning_rate": 1.257087770436195e-06, "loss": 1.3638, "step": 30887 }, { "epoch": 0.84, "learning_rate": 1.256658463298166e-06, "loss": 1.0347, "step": 30888 }, { "epoch": 0.84, "learning_rate": 1.2562292245639296e-06, "loss": 1.2705, "step": 30889 }, { "epoch": 0.84, "learning_rate": 1.255800054236842e-06, "loss": 1.7041, "step": 30890 }, { "epoch": 0.84, "learning_rate": 1.255370952320264e-06, "loss": 1.2783, "step": 30891 }, { "epoch": 0.84, "learning_rate": 1.2549419188175527e-06, "loss": 1.1887, "step": 30892 }, { "epoch": 0.84, "learning_rate": 1.2545129537320634e-06, "loss": 1.0461, "step": 30893 }, { "epoch": 0.84, "learning_rate": 1.2540840570671497e-06, "loss": 1.0022, "step": 30894 }, { "epoch": 0.84, "learning_rate": 1.2536552288261705e-06, "loss": 1.209, "step": 30895 }, { "epoch": 0.84, "learning_rate": 1.2532264690124841e-06, "loss": 1.3745, "step": 30896 }, { "epoch": 0.84, "learning_rate": 1.2527977776294365e-06, "loss": 1.1602, "step": 30897 }, { "epoch": 0.84, "learning_rate": 1.2523691546803872e-06, "loss": 1.1875, "step": 30898 }, { "epoch": 0.84, "learning_rate": 1.2519406001686874e-06, "loss": 1.2219, "step": 30899 }, { "epoch": 0.84, "learning_rate": 1.2515121140976937e-06, "loss": 1.2543, "step": 30900 }, { "epoch": 0.84, "learning_rate": 1.2510836964707518e-06, "loss": 1.2056, "step": 30901 }, { "epoch": 0.84, "learning_rate": 1.2506553472912197e-06, "loss": 1.2659, "step": 30902 }, { "epoch": 0.84, "learning_rate": 1.2502270665624428e-06, "loss": 1.2407, "step": 30903 }, { "epoch": 0.84, "learning_rate": 1.2497988542877805e-06, "loss": 1.2185, "step": 30904 }, { "epoch": 0.84, "learning_rate": 1.249370710470571e-06, "loss": 1.2693, "step": 30905 }, { "epoch": 0.84, "learning_rate": 1.2489426351141743e-06, "loss": 1.1233, "step": 30906 }, { "epoch": 0.84, "learning_rate": 1.2485146282219319e-06, "loss": 1.4546, "step": 30907 }, { "epoch": 0.84, "learning_rate": 1.248086689797201e-06, "loss": 1.2141, "step": 30908 }, { "epoch": 0.84, "learning_rate": 1.2476588198433193e-06, "loss": 1.292, "step": 30909 }, { "epoch": 0.84, "learning_rate": 1.2472310183636405e-06, "loss": 1.3408, "step": 30910 }, { "epoch": 0.84, "learning_rate": 1.246803285361511e-06, "loss": 1.2249, "step": 30911 }, { "epoch": 0.84, "learning_rate": 1.2463756208402778e-06, "loss": 1.2153, "step": 30912 }, { "epoch": 0.84, "learning_rate": 1.2459480248032851e-06, "loss": 1.2986, "step": 30913 }, { "epoch": 0.84, "learning_rate": 1.245520497253876e-06, "loss": 1.2957, "step": 30914 }, { "epoch": 0.84, "learning_rate": 1.2450930381954007e-06, "loss": 1.1294, "step": 30915 }, { "epoch": 0.84, "learning_rate": 1.2446656476312002e-06, "loss": 1.2737, "step": 30916 }, { "epoch": 0.84, "learning_rate": 1.2442383255646185e-06, "loss": 1.2708, "step": 30917 }, { "epoch": 0.84, "learning_rate": 1.243811071998997e-06, "loss": 1.1282, "step": 30918 }, { "epoch": 0.84, "learning_rate": 1.2433838869376824e-06, "loss": 1.5881, "step": 30919 }, { "epoch": 0.84, "learning_rate": 1.242956770384015e-06, "loss": 1.2651, "step": 30920 }, { "epoch": 0.84, "learning_rate": 1.2425297223413356e-06, "loss": 1.248, "step": 30921 }, { "epoch": 0.84, "learning_rate": 1.2421027428129838e-06, "loss": 1.2371, "step": 30922 }, { "epoch": 0.84, "learning_rate": 1.2416758318023037e-06, "loss": 1.1992, "step": 30923 }, { "epoch": 0.84, "learning_rate": 1.2412489893126333e-06, "loss": 1.3816, "step": 30924 }, { "epoch": 0.84, "learning_rate": 1.2408222153473105e-06, "loss": 1.3245, "step": 30925 }, { "epoch": 0.84, "learning_rate": 1.2403955099096775e-06, "loss": 1.3323, "step": 30926 }, { "epoch": 0.84, "learning_rate": 1.2399688730030712e-06, "loss": 1.1345, "step": 30927 }, { "epoch": 0.84, "learning_rate": 1.2395423046308285e-06, "loss": 1.2256, "step": 30928 }, { "epoch": 0.84, "learning_rate": 1.239115804796286e-06, "loss": 1.2734, "step": 30929 }, { "epoch": 0.84, "learning_rate": 1.238689373502784e-06, "loss": 1.075, "step": 30930 }, { "epoch": 0.84, "learning_rate": 1.2382630107536564e-06, "loss": 1.3313, "step": 30931 }, { "epoch": 0.84, "learning_rate": 1.2378367165522386e-06, "loss": 1.2876, "step": 30932 }, { "epoch": 0.84, "learning_rate": 1.2374104909018637e-06, "loss": 1.3599, "step": 30933 }, { "epoch": 0.84, "learning_rate": 1.2369843338058718e-06, "loss": 1.325, "step": 30934 }, { "epoch": 0.84, "learning_rate": 1.2365582452675927e-06, "loss": 1.2681, "step": 30935 }, { "epoch": 0.84, "learning_rate": 1.2361322252903619e-06, "loss": 1.2488, "step": 30936 }, { "epoch": 0.84, "learning_rate": 1.2357062738775082e-06, "loss": 1.2842, "step": 30937 }, { "epoch": 0.84, "learning_rate": 1.2352803910323708e-06, "loss": 1.2185, "step": 30938 }, { "epoch": 0.84, "learning_rate": 1.2348545767582777e-06, "loss": 1.26, "step": 30939 }, { "epoch": 0.84, "learning_rate": 1.2344288310585605e-06, "loss": 1.1765, "step": 30940 }, { "epoch": 0.84, "learning_rate": 1.2340031539365483e-06, "loss": 1.2888, "step": 30941 }, { "epoch": 0.85, "learning_rate": 1.2335775453955734e-06, "loss": 1.3174, "step": 30942 }, { "epoch": 0.85, "learning_rate": 1.2331520054389701e-06, "loss": 1.2588, "step": 30943 }, { "epoch": 0.85, "learning_rate": 1.2327265340700579e-06, "loss": 1.2859, "step": 30944 }, { "epoch": 0.85, "learning_rate": 1.2323011312921728e-06, "loss": 1.3225, "step": 30945 }, { "epoch": 0.85, "learning_rate": 1.2318757971086392e-06, "loss": 1.3101, "step": 30946 }, { "epoch": 0.85, "learning_rate": 1.2314505315227909e-06, "loss": 1.2581, "step": 30947 }, { "epoch": 0.85, "learning_rate": 1.2310253345379463e-06, "loss": 1.4231, "step": 30948 }, { "epoch": 0.85, "learning_rate": 1.2306002061574374e-06, "loss": 1.3643, "step": 30949 }, { "epoch": 0.85, "learning_rate": 1.2301751463845868e-06, "loss": 1.1001, "step": 30950 }, { "epoch": 0.85, "learning_rate": 1.2297501552227265e-06, "loss": 1.3716, "step": 30951 }, { "epoch": 0.85, "learning_rate": 1.2293252326751726e-06, "loss": 1.3022, "step": 30952 }, { "epoch": 0.85, "learning_rate": 1.228900378745256e-06, "loss": 1.1504, "step": 30953 }, { "epoch": 0.85, "learning_rate": 1.2284755934362957e-06, "loss": 1.1841, "step": 30954 }, { "epoch": 0.85, "learning_rate": 1.228050876751622e-06, "loss": 1.2683, "step": 30955 }, { "epoch": 0.85, "learning_rate": 1.2276262286945494e-06, "loss": 1.3301, "step": 30956 }, { "epoch": 0.85, "learning_rate": 1.2272016492684047e-06, "loss": 1.3457, "step": 30957 }, { "epoch": 0.85, "learning_rate": 1.2267771384765104e-06, "loss": 1.2156, "step": 30958 }, { "epoch": 0.85, "learning_rate": 1.226352696322186e-06, "loss": 1.3105, "step": 30959 }, { "epoch": 0.85, "learning_rate": 1.2259283228087536e-06, "loss": 1.3325, "step": 30960 }, { "epoch": 0.85, "learning_rate": 1.2255040179395294e-06, "loss": 1.2443, "step": 30961 }, { "epoch": 0.85, "learning_rate": 1.2250797817178384e-06, "loss": 1.4021, "step": 30962 }, { "epoch": 0.85, "learning_rate": 1.2246556141469956e-06, "loss": 1.1865, "step": 30963 }, { "epoch": 0.85, "learning_rate": 1.224231515230322e-06, "loss": 1.3389, "step": 30964 }, { "epoch": 0.85, "learning_rate": 1.2238074849711323e-06, "loss": 1.2634, "step": 30965 }, { "epoch": 0.85, "learning_rate": 1.2233835233727475e-06, "loss": 1.1716, "step": 30966 }, { "epoch": 0.85, "learning_rate": 1.2229596304384828e-06, "loss": 1.261, "step": 30967 }, { "epoch": 0.85, "learning_rate": 1.2225358061716553e-06, "loss": 1.1714, "step": 30968 }, { "epoch": 0.85, "learning_rate": 1.222112050575578e-06, "loss": 1.1162, "step": 30969 }, { "epoch": 0.85, "learning_rate": 1.2216883636535693e-06, "loss": 1.2417, "step": 30970 }, { "epoch": 0.85, "learning_rate": 1.2212647454089443e-06, "loss": 1.6597, "step": 30971 }, { "epoch": 0.85, "learning_rate": 1.220841195845014e-06, "loss": 1.1023, "step": 30972 }, { "epoch": 0.85, "learning_rate": 1.2204177149650952e-06, "loss": 1.2712, "step": 30973 }, { "epoch": 0.85, "learning_rate": 1.2199943027725002e-06, "loss": 1.3108, "step": 30974 }, { "epoch": 0.85, "learning_rate": 1.2195709592705408e-06, "loss": 1.2747, "step": 30975 }, { "epoch": 0.85, "learning_rate": 1.219147684462527e-06, "loss": 1.4668, "step": 30976 }, { "epoch": 0.85, "learning_rate": 1.218724478351776e-06, "loss": 1.3787, "step": 30977 }, { "epoch": 0.85, "learning_rate": 1.2183013409415945e-06, "loss": 1.1196, "step": 30978 }, { "epoch": 0.85, "learning_rate": 1.2178782722352932e-06, "loss": 1.4478, "step": 30979 }, { "epoch": 0.85, "learning_rate": 1.2174552722361822e-06, "loss": 1.238, "step": 30980 }, { "epoch": 0.85, "learning_rate": 1.2170323409475715e-06, "loss": 1.1396, "step": 30981 }, { "epoch": 0.85, "learning_rate": 1.2166094783727712e-06, "loss": 1.2134, "step": 30982 }, { "epoch": 0.85, "learning_rate": 1.2161866845150882e-06, "loss": 1.1567, "step": 30983 }, { "epoch": 0.85, "learning_rate": 1.215763959377827e-06, "loss": 1.2358, "step": 30984 }, { "epoch": 0.85, "learning_rate": 1.2153413029643001e-06, "loss": 1.5737, "step": 30985 }, { "epoch": 0.85, "learning_rate": 1.214918715277813e-06, "loss": 1.3879, "step": 30986 }, { "epoch": 0.85, "learning_rate": 1.2144961963216683e-06, "loss": 1.1748, "step": 30987 }, { "epoch": 0.85, "learning_rate": 1.214073746099176e-06, "loss": 1.1653, "step": 30988 }, { "epoch": 0.85, "learning_rate": 1.2136513646136371e-06, "loss": 1.0859, "step": 30989 }, { "epoch": 0.85, "learning_rate": 1.213229051868363e-06, "loss": 1.071, "step": 30990 }, { "epoch": 0.85, "learning_rate": 1.2128068078666488e-06, "loss": 1.3083, "step": 30991 }, { "epoch": 0.85, "learning_rate": 1.2123846326118038e-06, "loss": 1.1548, "step": 30992 }, { "epoch": 0.85, "learning_rate": 1.2119625261071266e-06, "loss": 1.3547, "step": 30993 }, { "epoch": 0.85, "learning_rate": 1.2115404883559267e-06, "loss": 1.2471, "step": 30994 }, { "epoch": 0.85, "learning_rate": 1.2111185193614983e-06, "loss": 1.7339, "step": 30995 }, { "epoch": 0.85, "learning_rate": 1.2106966191271462e-06, "loss": 1.1985, "step": 30996 }, { "epoch": 0.85, "learning_rate": 1.2102747876561704e-06, "loss": 1.1372, "step": 30997 }, { "epoch": 0.85, "learning_rate": 1.2098530249518748e-06, "loss": 1.1235, "step": 30998 }, { "epoch": 0.85, "learning_rate": 1.209431331017551e-06, "loss": 1.2258, "step": 30999 }, { "epoch": 0.85, "learning_rate": 1.2090097058565053e-06, "loss": 1.176, "step": 31000 }, { "epoch": 0.85, "learning_rate": 1.208588149472032e-06, "loss": 1.0934, "step": 31001 }, { "epoch": 0.85, "learning_rate": 1.2081666618674348e-06, "loss": 1.1412, "step": 31002 }, { "epoch": 0.85, "learning_rate": 1.2077452430460034e-06, "loss": 1.3621, "step": 31003 }, { "epoch": 0.85, "learning_rate": 1.2073238930110388e-06, "loss": 1.0432, "step": 31004 }, { "epoch": 0.85, "learning_rate": 1.20690261176584e-06, "loss": 1.2625, "step": 31005 }, { "epoch": 0.85, "learning_rate": 1.2064813993136993e-06, "loss": 1.2329, "step": 31006 }, { "epoch": 0.85, "learning_rate": 1.2060602556579137e-06, "loss": 1.3242, "step": 31007 }, { "epoch": 0.85, "learning_rate": 1.2056391808017753e-06, "loss": 1.3127, "step": 31008 }, { "epoch": 0.85, "learning_rate": 1.2052181747485836e-06, "loss": 1.2686, "step": 31009 }, { "epoch": 0.85, "learning_rate": 1.204797237501628e-06, "loss": 1.3535, "step": 31010 }, { "epoch": 0.85, "learning_rate": 1.204376369064204e-06, "loss": 1.2942, "step": 31011 }, { "epoch": 0.85, "learning_rate": 1.2039555694396011e-06, "loss": 1.0835, "step": 31012 }, { "epoch": 0.85, "learning_rate": 1.203534838631115e-06, "loss": 1.751, "step": 31013 }, { "epoch": 0.85, "learning_rate": 1.2031141766420363e-06, "loss": 1.2866, "step": 31014 }, { "epoch": 0.85, "learning_rate": 1.2026935834756559e-06, "loss": 1.2344, "step": 31015 }, { "epoch": 0.85, "learning_rate": 1.2022730591352615e-06, "loss": 1.416, "step": 31016 }, { "epoch": 0.85, "learning_rate": 1.2018526036241485e-06, "loss": 1.397, "step": 31017 }, { "epoch": 0.85, "learning_rate": 1.2014322169456028e-06, "loss": 1.3262, "step": 31018 }, { "epoch": 0.85, "learning_rate": 1.2010118991029118e-06, "loss": 1.3921, "step": 31019 }, { "epoch": 0.85, "learning_rate": 1.2005916500993686e-06, "loss": 1.1687, "step": 31020 }, { "epoch": 0.85, "learning_rate": 1.2001714699382594e-06, "loss": 1.2634, "step": 31021 }, { "epoch": 0.85, "learning_rate": 1.1997513586228694e-06, "loss": 1.7471, "step": 31022 }, { "epoch": 0.85, "learning_rate": 1.1993313161564857e-06, "loss": 1.2771, "step": 31023 }, { "epoch": 0.85, "learning_rate": 1.198911342542397e-06, "loss": 1.239, "step": 31024 }, { "epoch": 0.85, "learning_rate": 1.1984914377838862e-06, "loss": 1.095, "step": 31025 }, { "epoch": 0.85, "learning_rate": 1.1980716018842408e-06, "loss": 1.2302, "step": 31026 }, { "epoch": 0.85, "learning_rate": 1.1976518348467426e-06, "loss": 1.1738, "step": 31027 }, { "epoch": 0.85, "learning_rate": 1.1972321366746787e-06, "loss": 1.2285, "step": 31028 }, { "epoch": 0.85, "learning_rate": 1.196812507371331e-06, "loss": 1.345, "step": 31029 }, { "epoch": 0.85, "learning_rate": 1.1963929469399837e-06, "loss": 1.259, "step": 31030 }, { "epoch": 0.85, "learning_rate": 1.1959734553839154e-06, "loss": 1.3787, "step": 31031 }, { "epoch": 0.85, "learning_rate": 1.195554032706413e-06, "loss": 1.291, "step": 31032 }, { "epoch": 0.85, "learning_rate": 1.1951346789107555e-06, "loss": 1.3318, "step": 31033 }, { "epoch": 0.85, "learning_rate": 1.194715394000222e-06, "loss": 1.2791, "step": 31034 }, { "epoch": 0.85, "learning_rate": 1.194296177978097e-06, "loss": 1.4062, "step": 31035 }, { "epoch": 0.85, "learning_rate": 1.1938770308476555e-06, "loss": 1.2947, "step": 31036 }, { "epoch": 0.85, "learning_rate": 1.1934579526121836e-06, "loss": 1.2703, "step": 31037 }, { "epoch": 0.85, "learning_rate": 1.193038943274951e-06, "loss": 1.064, "step": 31038 }, { "epoch": 0.85, "learning_rate": 1.1926200028392432e-06, "loss": 1.2737, "step": 31039 }, { "epoch": 0.85, "learning_rate": 1.1922011313083327e-06, "loss": 1.3042, "step": 31040 }, { "epoch": 0.85, "learning_rate": 1.1917823286855002e-06, "loss": 1.2627, "step": 31041 }, { "epoch": 0.85, "learning_rate": 1.191363594974022e-06, "loss": 1.1785, "step": 31042 }, { "epoch": 0.85, "learning_rate": 1.1909449301771724e-06, "loss": 1.2231, "step": 31043 }, { "epoch": 0.85, "learning_rate": 1.1905263342982243e-06, "loss": 1.2471, "step": 31044 }, { "epoch": 0.85, "learning_rate": 1.1901078073404593e-06, "loss": 1.1367, "step": 31045 }, { "epoch": 0.85, "learning_rate": 1.189689349307147e-06, "loss": 1.1562, "step": 31046 }, { "epoch": 0.85, "learning_rate": 1.1892709602015628e-06, "loss": 1.2244, "step": 31047 }, { "epoch": 0.85, "learning_rate": 1.1888526400269773e-06, "loss": 1.1401, "step": 31048 }, { "epoch": 0.85, "learning_rate": 1.1884343887866678e-06, "loss": 1.3538, "step": 31049 }, { "epoch": 0.85, "learning_rate": 1.188016206483904e-06, "loss": 1.3008, "step": 31050 }, { "epoch": 0.85, "learning_rate": 1.1875980931219554e-06, "loss": 1.2854, "step": 31051 }, { "epoch": 0.85, "learning_rate": 1.1871800487040986e-06, "loss": 1.7422, "step": 31052 }, { "epoch": 0.85, "learning_rate": 1.1867620732335994e-06, "loss": 1.2385, "step": 31053 }, { "epoch": 0.85, "learning_rate": 1.18634416671373e-06, "loss": 1.3254, "step": 31054 }, { "epoch": 0.85, "learning_rate": 1.1859263291477573e-06, "loss": 1.3752, "step": 31055 }, { "epoch": 0.85, "learning_rate": 1.1855085605389548e-06, "loss": 1.2419, "step": 31056 }, { "epoch": 0.85, "learning_rate": 1.1850908608905886e-06, "loss": 1.3401, "step": 31057 }, { "epoch": 0.85, "learning_rate": 1.1846732302059261e-06, "loss": 1.0298, "step": 31058 }, { "epoch": 0.85, "learning_rate": 1.1842556684882333e-06, "loss": 1.2324, "step": 31059 }, { "epoch": 0.85, "learning_rate": 1.1838381757407802e-06, "loss": 1.3064, "step": 31060 }, { "epoch": 0.85, "learning_rate": 1.1834207519668317e-06, "loss": 1.2424, "step": 31061 }, { "epoch": 0.85, "learning_rate": 1.1830033971696532e-06, "loss": 1.3381, "step": 31062 }, { "epoch": 0.85, "learning_rate": 1.1825861113525083e-06, "loss": 1.0823, "step": 31063 }, { "epoch": 0.85, "learning_rate": 1.182168894518666e-06, "loss": 1.3179, "step": 31064 }, { "epoch": 0.85, "learning_rate": 1.1817517466713868e-06, "loss": 1.3484, "step": 31065 }, { "epoch": 0.85, "learning_rate": 1.1813346678139338e-06, "loss": 1.3772, "step": 31066 }, { "epoch": 0.85, "learning_rate": 1.1809176579495728e-06, "loss": 1.302, "step": 31067 }, { "epoch": 0.85, "learning_rate": 1.1805007170815662e-06, "loss": 1.2859, "step": 31068 }, { "epoch": 0.85, "learning_rate": 1.1800838452131746e-06, "loss": 1.2275, "step": 31069 }, { "epoch": 0.85, "learning_rate": 1.1796670423476575e-06, "loss": 1.3994, "step": 31070 }, { "epoch": 0.85, "learning_rate": 1.179250308488279e-06, "loss": 1.2336, "step": 31071 }, { "epoch": 0.85, "learning_rate": 1.1788336436382974e-06, "loss": 1.4072, "step": 31072 }, { "epoch": 0.85, "learning_rate": 1.1784170478009771e-06, "loss": 1.2278, "step": 31073 }, { "epoch": 0.85, "learning_rate": 1.1780005209795686e-06, "loss": 1.5093, "step": 31074 }, { "epoch": 0.85, "learning_rate": 1.1775840631773383e-06, "loss": 1.1519, "step": 31075 }, { "epoch": 0.85, "learning_rate": 1.1771676743975403e-06, "loss": 1.2839, "step": 31076 }, { "epoch": 0.85, "learning_rate": 1.1767513546434372e-06, "loss": 1.1682, "step": 31077 }, { "epoch": 0.85, "learning_rate": 1.176335103918278e-06, "loss": 1.2571, "step": 31078 }, { "epoch": 0.85, "learning_rate": 1.1759189222253265e-06, "loss": 1.1597, "step": 31079 }, { "epoch": 0.85, "learning_rate": 1.1755028095678335e-06, "loss": 1.0742, "step": 31080 }, { "epoch": 0.85, "learning_rate": 1.1750867659490595e-06, "loss": 1.2881, "step": 31081 }, { "epoch": 0.85, "learning_rate": 1.1746707913722566e-06, "loss": 1.3235, "step": 31082 }, { "epoch": 0.85, "learning_rate": 1.1742548858406767e-06, "loss": 1.3379, "step": 31083 }, { "epoch": 0.85, "learning_rate": 1.1738390493575792e-06, "loss": 1.394, "step": 31084 }, { "epoch": 0.85, "learning_rate": 1.1734232819262148e-06, "loss": 1.1467, "step": 31085 }, { "epoch": 0.85, "learning_rate": 1.1730075835498357e-06, "loss": 1.6782, "step": 31086 }, { "epoch": 0.85, "learning_rate": 1.1725919542316921e-06, "loss": 1.2759, "step": 31087 }, { "epoch": 0.85, "learning_rate": 1.1721763939750408e-06, "loss": 1.2373, "step": 31088 }, { "epoch": 0.85, "learning_rate": 1.17176090278313e-06, "loss": 1.2935, "step": 31089 }, { "epoch": 0.85, "learning_rate": 1.1713454806592118e-06, "loss": 1.2573, "step": 31090 }, { "epoch": 0.85, "learning_rate": 1.170930127606531e-06, "loss": 1.0623, "step": 31091 }, { "epoch": 0.85, "learning_rate": 1.1705148436283443e-06, "loss": 1.374, "step": 31092 }, { "epoch": 0.85, "learning_rate": 1.1700996287278977e-06, "loss": 1.0999, "step": 31093 }, { "epoch": 0.85, "learning_rate": 1.1696844829084386e-06, "loss": 1.2205, "step": 31094 }, { "epoch": 0.85, "learning_rate": 1.1692694061732146e-06, "loss": 1.3367, "step": 31095 }, { "epoch": 0.85, "learning_rate": 1.1688543985254763e-06, "loss": 1.1743, "step": 31096 }, { "epoch": 0.85, "learning_rate": 1.1684394599684678e-06, "loss": 1.1389, "step": 31097 }, { "epoch": 0.85, "learning_rate": 1.1680245905054344e-06, "loss": 1.4524, "step": 31098 }, { "epoch": 0.85, "learning_rate": 1.1676097901396255e-06, "loss": 1.2876, "step": 31099 }, { "epoch": 0.85, "learning_rate": 1.1671950588742842e-06, "loss": 1.3296, "step": 31100 }, { "epoch": 0.85, "learning_rate": 1.1667803967126556e-06, "loss": 1.1611, "step": 31101 }, { "epoch": 0.85, "learning_rate": 1.1663658036579817e-06, "loss": 1.1782, "step": 31102 }, { "epoch": 0.85, "learning_rate": 1.1659512797135098e-06, "loss": 1.2266, "step": 31103 }, { "epoch": 0.85, "learning_rate": 1.1655368248824805e-06, "loss": 1.2305, "step": 31104 }, { "epoch": 0.85, "learning_rate": 1.1651224391681372e-06, "loss": 1.3289, "step": 31105 }, { "epoch": 0.85, "learning_rate": 1.164708122573719e-06, "loss": 1.2463, "step": 31106 }, { "epoch": 0.85, "learning_rate": 1.1642938751024723e-06, "loss": 1.2852, "step": 31107 }, { "epoch": 0.85, "learning_rate": 1.163879696757635e-06, "loss": 1.165, "step": 31108 }, { "epoch": 0.85, "learning_rate": 1.1634655875424483e-06, "loss": 1.2712, "step": 31109 }, { "epoch": 0.85, "learning_rate": 1.16305154746015e-06, "loss": 1.2112, "step": 31110 }, { "epoch": 0.85, "learning_rate": 1.162637576513981e-06, "loss": 1.376, "step": 31111 }, { "epoch": 0.85, "learning_rate": 1.1622236747071835e-06, "loss": 1.2949, "step": 31112 }, { "epoch": 0.85, "learning_rate": 1.161809842042988e-06, "loss": 1.218, "step": 31113 }, { "epoch": 0.85, "learning_rate": 1.161396078524638e-06, "loss": 1.2817, "step": 31114 }, { "epoch": 0.85, "learning_rate": 1.1609823841553681e-06, "loss": 1.4438, "step": 31115 }, { "epoch": 0.85, "learning_rate": 1.1605687589384184e-06, "loss": 1.2341, "step": 31116 }, { "epoch": 0.85, "learning_rate": 1.160155202877019e-06, "loss": 1.2405, "step": 31117 }, { "epoch": 0.85, "learning_rate": 1.1597417159744095e-06, "loss": 1.2783, "step": 31118 }, { "epoch": 0.85, "learning_rate": 1.1593282982338228e-06, "loss": 1.2505, "step": 31119 }, { "epoch": 0.85, "learning_rate": 1.1589149496584984e-06, "loss": 1.2079, "step": 31120 }, { "epoch": 0.85, "learning_rate": 1.1585016702516617e-06, "loss": 1.156, "step": 31121 }, { "epoch": 0.85, "learning_rate": 1.1580884600165521e-06, "loss": 1.1068, "step": 31122 }, { "epoch": 0.85, "learning_rate": 1.1576753189563982e-06, "loss": 1.1934, "step": 31123 }, { "epoch": 0.85, "learning_rate": 1.1572622470744399e-06, "loss": 1.2629, "step": 31124 }, { "epoch": 0.85, "learning_rate": 1.1568492443738988e-06, "loss": 1.2637, "step": 31125 }, { "epoch": 0.85, "learning_rate": 1.1564363108580135e-06, "loss": 1.2861, "step": 31126 }, { "epoch": 0.85, "learning_rate": 1.156023446530009e-06, "loss": 1.3342, "step": 31127 }, { "epoch": 0.85, "learning_rate": 1.155610651393121e-06, "loss": 1.2773, "step": 31128 }, { "epoch": 0.85, "learning_rate": 1.1551979254505764e-06, "loss": 1.3691, "step": 31129 }, { "epoch": 0.85, "learning_rate": 1.1547852687056016e-06, "loss": 1.3879, "step": 31130 }, { "epoch": 0.85, "learning_rate": 1.1543726811614297e-06, "loss": 1.2261, "step": 31131 }, { "epoch": 0.85, "learning_rate": 1.1539601628212872e-06, "loss": 1.2456, "step": 31132 }, { "epoch": 0.85, "learning_rate": 1.1535477136884e-06, "loss": 1.1855, "step": 31133 }, { "epoch": 0.85, "learning_rate": 1.1531353337659935e-06, "loss": 1.3533, "step": 31134 }, { "epoch": 0.85, "learning_rate": 1.1527230230572984e-06, "loss": 1.3936, "step": 31135 }, { "epoch": 0.85, "learning_rate": 1.1523107815655376e-06, "loss": 1.2993, "step": 31136 }, { "epoch": 0.85, "learning_rate": 1.1518986092939377e-06, "loss": 1.3137, "step": 31137 }, { "epoch": 0.85, "learning_rate": 1.1514865062457193e-06, "loss": 1.2212, "step": 31138 }, { "epoch": 0.85, "learning_rate": 1.151074472424113e-06, "loss": 1.1553, "step": 31139 }, { "epoch": 0.85, "learning_rate": 1.1506625078323375e-06, "loss": 1.2577, "step": 31140 }, { "epoch": 0.85, "learning_rate": 1.1502506124736179e-06, "loss": 1.3452, "step": 31141 }, { "epoch": 0.85, "learning_rate": 1.149838786351174e-06, "loss": 1.2847, "step": 31142 }, { "epoch": 0.85, "learning_rate": 1.1494270294682318e-06, "loss": 1.0957, "step": 31143 }, { "epoch": 0.85, "learning_rate": 1.1490153418280115e-06, "loss": 1.2415, "step": 31144 }, { "epoch": 0.85, "learning_rate": 1.14860372343373e-06, "loss": 1.2825, "step": 31145 }, { "epoch": 0.85, "learning_rate": 1.1481921742886126e-06, "loss": 1.1235, "step": 31146 }, { "epoch": 0.85, "learning_rate": 1.1477806943958781e-06, "loss": 1.2024, "step": 31147 }, { "epoch": 0.85, "learning_rate": 1.1473692837587447e-06, "loss": 1.386, "step": 31148 }, { "epoch": 0.85, "learning_rate": 1.1469579423804289e-06, "loss": 1.1165, "step": 31149 }, { "epoch": 0.85, "learning_rate": 1.1465466702641536e-06, "loss": 1.1772, "step": 31150 }, { "epoch": 0.85, "learning_rate": 1.146135467413133e-06, "loss": 1.3562, "step": 31151 }, { "epoch": 0.85, "learning_rate": 1.1457243338305856e-06, "loss": 1.075, "step": 31152 }, { "epoch": 0.85, "learning_rate": 1.1453132695197267e-06, "loss": 1.3364, "step": 31153 }, { "epoch": 0.85, "learning_rate": 1.1449022744837734e-06, "loss": 1.3608, "step": 31154 }, { "epoch": 0.85, "learning_rate": 1.1444913487259413e-06, "loss": 1.2683, "step": 31155 }, { "epoch": 0.85, "learning_rate": 1.1440804922494442e-06, "loss": 1.2629, "step": 31156 }, { "epoch": 0.85, "learning_rate": 1.1436697050574962e-06, "loss": 1.123, "step": 31157 }, { "epoch": 0.85, "learning_rate": 1.1432589871533105e-06, "loss": 1.3364, "step": 31158 }, { "epoch": 0.85, "learning_rate": 1.1428483385401069e-06, "loss": 1.3848, "step": 31159 }, { "epoch": 0.85, "learning_rate": 1.1424377592210889e-06, "loss": 1.2639, "step": 31160 }, { "epoch": 0.85, "learning_rate": 1.1420272491994744e-06, "loss": 1.0815, "step": 31161 }, { "epoch": 0.85, "learning_rate": 1.1416168084784707e-06, "loss": 1.4089, "step": 31162 }, { "epoch": 0.85, "learning_rate": 1.1412064370612963e-06, "loss": 1.0806, "step": 31163 }, { "epoch": 0.85, "learning_rate": 1.140796134951153e-06, "loss": 1.3008, "step": 31164 }, { "epoch": 0.85, "learning_rate": 1.1403859021512564e-06, "loss": 1.2642, "step": 31165 }, { "epoch": 0.85, "learning_rate": 1.1399757386648137e-06, "loss": 1.0286, "step": 31166 }, { "epoch": 0.85, "learning_rate": 1.1395656444950376e-06, "loss": 1.1896, "step": 31167 }, { "epoch": 0.85, "learning_rate": 1.1391556196451292e-06, "loss": 1.2161, "step": 31168 }, { "epoch": 0.85, "learning_rate": 1.1387456641183026e-06, "loss": 1.1523, "step": 31169 }, { "epoch": 0.85, "learning_rate": 1.1383357779177617e-06, "loss": 1.8081, "step": 31170 }, { "epoch": 0.85, "learning_rate": 1.1379259610467185e-06, "loss": 1.1987, "step": 31171 }, { "epoch": 0.85, "learning_rate": 1.1375162135083705e-06, "loss": 1.2766, "step": 31172 }, { "epoch": 0.85, "learning_rate": 1.1371065353059296e-06, "loss": 1.2407, "step": 31173 }, { "epoch": 0.85, "learning_rate": 1.1366969264425998e-06, "loss": 1.1077, "step": 31174 }, { "epoch": 0.85, "learning_rate": 1.1362873869215873e-06, "loss": 1.3462, "step": 31175 }, { "epoch": 0.85, "learning_rate": 1.1358779167460932e-06, "loss": 1.3118, "step": 31176 }, { "epoch": 0.85, "learning_rate": 1.1354685159193202e-06, "loss": 1.2415, "step": 31177 }, { "epoch": 0.85, "learning_rate": 1.1350591844444747e-06, "loss": 1.2993, "step": 31178 }, { "epoch": 0.85, "learning_rate": 1.1346499223247587e-06, "loss": 1.1028, "step": 31179 }, { "epoch": 0.85, "learning_rate": 1.1342407295633717e-06, "loss": 1.2556, "step": 31180 }, { "epoch": 0.85, "learning_rate": 1.1338316061635146e-06, "loss": 1.2565, "step": 31181 }, { "epoch": 0.85, "learning_rate": 1.1334225521283925e-06, "loss": 1.3774, "step": 31182 }, { "epoch": 0.85, "learning_rate": 1.133013567461203e-06, "loss": 1.1624, "step": 31183 }, { "epoch": 0.85, "learning_rate": 1.1326046521651446e-06, "loss": 1.1985, "step": 31184 }, { "epoch": 0.85, "learning_rate": 1.132195806243417e-06, "loss": 1.2639, "step": 31185 }, { "epoch": 0.85, "learning_rate": 1.1317870296992206e-06, "loss": 1.1755, "step": 31186 }, { "epoch": 0.85, "learning_rate": 1.1313783225357532e-06, "loss": 1.4155, "step": 31187 }, { "epoch": 0.85, "learning_rate": 1.1309696847562103e-06, "loss": 1.3623, "step": 31188 }, { "epoch": 0.85, "learning_rate": 1.1305611163637886e-06, "loss": 1.3064, "step": 31189 }, { "epoch": 0.85, "learning_rate": 1.1301526173616883e-06, "loss": 1.3423, "step": 31190 }, { "epoch": 0.85, "learning_rate": 1.1297441877531034e-06, "loss": 1.4172, "step": 31191 }, { "epoch": 0.85, "learning_rate": 1.1293358275412259e-06, "loss": 1.3284, "step": 31192 }, { "epoch": 0.85, "learning_rate": 1.1289275367292562e-06, "loss": 1.4053, "step": 31193 }, { "epoch": 0.85, "learning_rate": 1.1285193153203855e-06, "loss": 1.3884, "step": 31194 }, { "epoch": 0.85, "learning_rate": 1.1281111633178089e-06, "loss": 1.2893, "step": 31195 }, { "epoch": 0.85, "learning_rate": 1.1277030807247159e-06, "loss": 1.1785, "step": 31196 }, { "epoch": 0.85, "learning_rate": 1.127295067544304e-06, "loss": 1.2634, "step": 31197 }, { "epoch": 0.85, "learning_rate": 1.126887123779764e-06, "loss": 1.3049, "step": 31198 }, { "epoch": 0.85, "learning_rate": 1.1264792494342858e-06, "loss": 1.2512, "step": 31199 }, { "epoch": 0.85, "learning_rate": 1.12607144451106e-06, "loss": 1.2637, "step": 31200 }, { "epoch": 0.85, "learning_rate": 1.1256637090132794e-06, "loss": 1.1248, "step": 31201 }, { "epoch": 0.85, "learning_rate": 1.1252560429441339e-06, "loss": 1.2944, "step": 31202 }, { "epoch": 0.85, "learning_rate": 1.124848446306812e-06, "loss": 1.0898, "step": 31203 }, { "epoch": 0.85, "learning_rate": 1.1244409191045002e-06, "loss": 1.2874, "step": 31204 }, { "epoch": 0.85, "learning_rate": 1.1240334613403892e-06, "loss": 1.3628, "step": 31205 }, { "epoch": 0.85, "learning_rate": 1.1236260730176695e-06, "loss": 1.0139, "step": 31206 }, { "epoch": 0.85, "learning_rate": 1.1232187541395224e-06, "loss": 1.3215, "step": 31207 }, { "epoch": 0.85, "learning_rate": 1.1228115047091403e-06, "loss": 1.2026, "step": 31208 }, { "epoch": 0.85, "learning_rate": 1.1224043247297035e-06, "loss": 1.343, "step": 31209 }, { "epoch": 0.85, "learning_rate": 1.1219972142044056e-06, "loss": 1.2146, "step": 31210 }, { "epoch": 0.85, "learning_rate": 1.121590173136422e-06, "loss": 1.4421, "step": 31211 }, { "epoch": 0.85, "learning_rate": 1.1211832015289449e-06, "loss": 1.1724, "step": 31212 }, { "epoch": 0.85, "learning_rate": 1.1207762993851523e-06, "loss": 1.1614, "step": 31213 }, { "epoch": 0.85, "learning_rate": 1.1203694667082344e-06, "loss": 1.0703, "step": 31214 }, { "epoch": 0.85, "learning_rate": 1.119962703501367e-06, "loss": 1.1853, "step": 31215 }, { "epoch": 0.85, "learning_rate": 1.1195560097677382e-06, "loss": 1.2251, "step": 31216 }, { "epoch": 0.85, "learning_rate": 1.119149385510524e-06, "loss": 1.1675, "step": 31217 }, { "epoch": 0.85, "learning_rate": 1.118742830732914e-06, "loss": 1.4065, "step": 31218 }, { "epoch": 0.85, "learning_rate": 1.118336345438079e-06, "loss": 1.7183, "step": 31219 }, { "epoch": 0.85, "learning_rate": 1.1179299296292046e-06, "loss": 1.3052, "step": 31220 }, { "epoch": 0.85, "learning_rate": 1.1175235833094722e-06, "loss": 1.1897, "step": 31221 }, { "epoch": 0.85, "learning_rate": 1.1171173064820572e-06, "loss": 1.1775, "step": 31222 }, { "epoch": 0.85, "learning_rate": 1.1167110991501406e-06, "loss": 1.3936, "step": 31223 }, { "epoch": 0.85, "learning_rate": 1.1163049613168963e-06, "loss": 1.1245, "step": 31224 }, { "epoch": 0.85, "learning_rate": 1.1158988929855074e-06, "loss": 1.3198, "step": 31225 }, { "epoch": 0.85, "learning_rate": 1.115492894159147e-06, "loss": 1.3083, "step": 31226 }, { "epoch": 0.85, "learning_rate": 1.1150869648409935e-06, "loss": 1.6069, "step": 31227 }, { "epoch": 0.85, "learning_rate": 1.1146811050342187e-06, "loss": 1.3127, "step": 31228 }, { "epoch": 0.85, "learning_rate": 1.1142753147420027e-06, "loss": 1.1868, "step": 31229 }, { "epoch": 0.85, "learning_rate": 1.1138695939675193e-06, "loss": 1.2715, "step": 31230 }, { "epoch": 0.85, "learning_rate": 1.1134639427139404e-06, "loss": 1.241, "step": 31231 }, { "epoch": 0.85, "learning_rate": 1.1130583609844402e-06, "loss": 1.1687, "step": 31232 }, { "epoch": 0.85, "learning_rate": 1.112652848782193e-06, "loss": 1.2856, "step": 31233 }, { "epoch": 0.85, "learning_rate": 1.1122474061103717e-06, "loss": 1.272, "step": 31234 }, { "epoch": 0.85, "learning_rate": 1.1118420329721468e-06, "loss": 1.3533, "step": 31235 }, { "epoch": 0.85, "learning_rate": 1.1114367293706896e-06, "loss": 1.2415, "step": 31236 }, { "epoch": 0.85, "learning_rate": 1.1110314953091728e-06, "loss": 1.3523, "step": 31237 }, { "epoch": 0.85, "learning_rate": 1.110626330790765e-06, "loss": 1.1116, "step": 31238 }, { "epoch": 0.85, "learning_rate": 1.110221235818636e-06, "loss": 0.991, "step": 31239 }, { "epoch": 0.85, "learning_rate": 1.1098162103959564e-06, "loss": 1.2708, "step": 31240 }, { "epoch": 0.85, "learning_rate": 1.109411254525895e-06, "loss": 1.3362, "step": 31241 }, { "epoch": 0.85, "learning_rate": 1.1090063682116203e-06, "loss": 1.3245, "step": 31242 }, { "epoch": 0.85, "learning_rate": 1.1086015514562952e-06, "loss": 1.1912, "step": 31243 }, { "epoch": 0.85, "learning_rate": 1.1081968042630942e-06, "loss": 1.2588, "step": 31244 }, { "epoch": 0.85, "learning_rate": 1.1077921266351788e-06, "loss": 1.2458, "step": 31245 }, { "epoch": 0.85, "learning_rate": 1.1073875185757177e-06, "loss": 1.1562, "step": 31246 }, { "epoch": 0.85, "learning_rate": 1.1069829800878717e-06, "loss": 1.2996, "step": 31247 }, { "epoch": 0.85, "learning_rate": 1.1065785111748117e-06, "loss": 1.1731, "step": 31248 }, { "epoch": 0.85, "learning_rate": 1.1061741118396996e-06, "loss": 1.353, "step": 31249 }, { "epoch": 0.85, "learning_rate": 1.1057697820856993e-06, "loss": 1.1783, "step": 31250 }, { "epoch": 0.85, "learning_rate": 1.1053655219159709e-06, "loss": 1.1846, "step": 31251 }, { "epoch": 0.85, "learning_rate": 1.1049613313336804e-06, "loss": 1.2551, "step": 31252 }, { "epoch": 0.85, "learning_rate": 1.1045572103419944e-06, "loss": 1.2388, "step": 31253 }, { "epoch": 0.85, "learning_rate": 1.1041531589440657e-06, "loss": 1.3667, "step": 31254 }, { "epoch": 0.85, "learning_rate": 1.1037491771430608e-06, "loss": 1.1904, "step": 31255 }, { "epoch": 0.85, "learning_rate": 1.1033452649421371e-06, "loss": 1.3835, "step": 31256 }, { "epoch": 0.85, "learning_rate": 1.1029414223444612e-06, "loss": 1.2595, "step": 31257 }, { "epoch": 0.85, "learning_rate": 1.1025376493531836e-06, "loss": 1.3264, "step": 31258 }, { "epoch": 0.85, "learning_rate": 1.1021339459714697e-06, "loss": 1.3179, "step": 31259 }, { "epoch": 0.85, "learning_rate": 1.1017303122024737e-06, "loss": 1.2825, "step": 31260 }, { "epoch": 0.85, "learning_rate": 1.1013267480493596e-06, "loss": 1.1688, "step": 31261 }, { "epoch": 0.85, "learning_rate": 1.100923253515277e-06, "loss": 1.448, "step": 31262 }, { "epoch": 0.85, "learning_rate": 1.100519828603387e-06, "loss": 1.2266, "step": 31263 }, { "epoch": 0.85, "learning_rate": 1.1001164733168435e-06, "loss": 1.4045, "step": 31264 }, { "epoch": 0.85, "learning_rate": 1.0997131876588086e-06, "loss": 1.3357, "step": 31265 }, { "epoch": 0.85, "learning_rate": 1.0993099716324273e-06, "loss": 1.2334, "step": 31266 }, { "epoch": 0.85, "learning_rate": 1.0989068252408596e-06, "loss": 1.2292, "step": 31267 }, { "epoch": 0.85, "learning_rate": 1.0985037484872618e-06, "loss": 1.4043, "step": 31268 }, { "epoch": 0.85, "learning_rate": 1.0981007413747847e-06, "loss": 1.1782, "step": 31269 }, { "epoch": 0.85, "learning_rate": 1.0976978039065822e-06, "loss": 1.2288, "step": 31270 }, { "epoch": 0.85, "learning_rate": 1.097294936085803e-06, "loss": 1.4102, "step": 31271 }, { "epoch": 0.85, "learning_rate": 1.0968921379156039e-06, "loss": 1.2334, "step": 31272 }, { "epoch": 0.85, "learning_rate": 1.096489409399134e-06, "loss": 1.2612, "step": 31273 }, { "epoch": 0.85, "learning_rate": 1.0960867505395445e-06, "loss": 1.3833, "step": 31274 }, { "epoch": 0.85, "learning_rate": 1.0956841613399838e-06, "loss": 1.2683, "step": 31275 }, { "epoch": 0.85, "learning_rate": 1.0952816418036038e-06, "loss": 1.1404, "step": 31276 }, { "epoch": 0.85, "learning_rate": 1.0948791919335545e-06, "loss": 1.2507, "step": 31277 }, { "epoch": 0.85, "learning_rate": 1.0944768117329818e-06, "loss": 1.6948, "step": 31278 }, { "epoch": 0.85, "learning_rate": 1.0940745012050336e-06, "loss": 1.209, "step": 31279 }, { "epoch": 0.85, "learning_rate": 1.0936722603528605e-06, "loss": 1.2825, "step": 31280 }, { "epoch": 0.85, "learning_rate": 1.0932700891796078e-06, "loss": 1.2324, "step": 31281 }, { "epoch": 0.85, "learning_rate": 1.0928679876884186e-06, "loss": 1.1958, "step": 31282 }, { "epoch": 0.85, "learning_rate": 1.0924659558824446e-06, "loss": 1.1301, "step": 31283 }, { "epoch": 0.85, "learning_rate": 1.092063993764828e-06, "loss": 1.3054, "step": 31284 }, { "epoch": 0.85, "learning_rate": 1.091662101338714e-06, "loss": 1.3345, "step": 31285 }, { "epoch": 0.85, "learning_rate": 1.0912602786072457e-06, "loss": 1.2444, "step": 31286 }, { "epoch": 0.85, "learning_rate": 1.0908585255735692e-06, "loss": 0.99, "step": 31287 }, { "epoch": 0.85, "learning_rate": 1.0904568422408258e-06, "loss": 1.1188, "step": 31288 }, { "epoch": 0.85, "learning_rate": 1.0900552286121591e-06, "loss": 1.3354, "step": 31289 }, { "epoch": 0.85, "learning_rate": 1.089653684690708e-06, "loss": 1.196, "step": 31290 }, { "epoch": 0.85, "learning_rate": 1.0892522104796188e-06, "loss": 1.1257, "step": 31291 }, { "epoch": 0.85, "learning_rate": 1.0888508059820301e-06, "loss": 1.1165, "step": 31292 }, { "epoch": 0.85, "learning_rate": 1.0884494712010818e-06, "loss": 1.2581, "step": 31293 }, { "epoch": 0.85, "learning_rate": 1.0880482061399133e-06, "loss": 1.2117, "step": 31294 }, { "epoch": 0.85, "learning_rate": 1.0876470108016667e-06, "loss": 1.1204, "step": 31295 }, { "epoch": 0.85, "learning_rate": 1.0872458851894786e-06, "loss": 1.396, "step": 31296 }, { "epoch": 0.85, "learning_rate": 1.086844829306488e-06, "loss": 1.3428, "step": 31297 }, { "epoch": 0.85, "learning_rate": 1.08644384315583e-06, "loss": 1.1649, "step": 31298 }, { "epoch": 0.85, "learning_rate": 1.0860429267406436e-06, "loss": 1.197, "step": 31299 }, { "epoch": 0.85, "learning_rate": 1.08564208006407e-06, "loss": 1.2708, "step": 31300 }, { "epoch": 0.85, "learning_rate": 1.0852413031292375e-06, "loss": 1.2656, "step": 31301 }, { "epoch": 0.85, "learning_rate": 1.084840595939286e-06, "loss": 1.2102, "step": 31302 }, { "epoch": 0.85, "learning_rate": 1.0844399584973486e-06, "loss": 1.3647, "step": 31303 }, { "epoch": 0.85, "learning_rate": 1.0840393908065616e-06, "loss": 1.2026, "step": 31304 }, { "epoch": 0.85, "learning_rate": 1.083638892870058e-06, "loss": 1.2368, "step": 31305 }, { "epoch": 0.85, "learning_rate": 1.0832384646909723e-06, "loss": 1.239, "step": 31306 }, { "epoch": 0.85, "learning_rate": 1.0828381062724325e-06, "loss": 1.3208, "step": 31307 }, { "epoch": 0.86, "learning_rate": 1.0824378176175765e-06, "loss": 1.1992, "step": 31308 }, { "epoch": 0.86, "learning_rate": 1.082037598729533e-06, "loss": 1.2979, "step": 31309 }, { "epoch": 0.86, "learning_rate": 1.0816374496114345e-06, "loss": 1.1738, "step": 31310 }, { "epoch": 0.86, "learning_rate": 1.0812373702664092e-06, "loss": 1.2489, "step": 31311 }, { "epoch": 0.86, "learning_rate": 1.0808373606975908e-06, "loss": 1.2224, "step": 31312 }, { "epoch": 0.86, "learning_rate": 1.0804374209081058e-06, "loss": 1.1279, "step": 31313 }, { "epoch": 0.86, "learning_rate": 1.080037550901083e-06, "loss": 1.2827, "step": 31314 }, { "epoch": 0.86, "learning_rate": 1.079637750679654e-06, "loss": 1.2649, "step": 31315 }, { "epoch": 0.86, "learning_rate": 1.0792380202469444e-06, "loss": 1.0708, "step": 31316 }, { "epoch": 0.86, "learning_rate": 1.0788383596060814e-06, "loss": 1.2136, "step": 31317 }, { "epoch": 0.86, "learning_rate": 1.0784387687601904e-06, "loss": 1.3005, "step": 31318 }, { "epoch": 0.86, "learning_rate": 1.0780392477124014e-06, "loss": 1.2686, "step": 31319 }, { "epoch": 0.86, "learning_rate": 1.077639796465838e-06, "loss": 1.2742, "step": 31320 }, { "epoch": 0.86, "learning_rate": 1.0772404150236248e-06, "loss": 1.3606, "step": 31321 }, { "epoch": 0.86, "learning_rate": 1.0768411033888848e-06, "loss": 1.2666, "step": 31322 }, { "epoch": 0.86, "learning_rate": 1.0764418615647464e-06, "loss": 1.304, "step": 31323 }, { "epoch": 0.86, "learning_rate": 1.0760426895543296e-06, "loss": 1.1357, "step": 31324 }, { "epoch": 0.86, "learning_rate": 1.0756435873607595e-06, "loss": 1.2017, "step": 31325 }, { "epoch": 0.86, "learning_rate": 1.075244554987156e-06, "loss": 1.1172, "step": 31326 }, { "epoch": 0.86, "learning_rate": 1.074845592436643e-06, "loss": 1.373, "step": 31327 }, { "epoch": 0.86, "learning_rate": 1.0744466997123426e-06, "loss": 1.1931, "step": 31328 }, { "epoch": 0.86, "learning_rate": 1.0740478768173712e-06, "loss": 1.0581, "step": 31329 }, { "epoch": 0.86, "learning_rate": 1.0736491237548541e-06, "loss": 1.3032, "step": 31330 }, { "epoch": 0.86, "learning_rate": 1.0732504405279088e-06, "loss": 1.259, "step": 31331 }, { "epoch": 0.86, "learning_rate": 1.0728518271396548e-06, "loss": 1.293, "step": 31332 }, { "epoch": 0.86, "learning_rate": 1.0724532835932078e-06, "loss": 1.2634, "step": 31333 }, { "epoch": 0.86, "learning_rate": 1.0720548098916906e-06, "loss": 1.344, "step": 31334 }, { "epoch": 0.86, "learning_rate": 1.0716564060382174e-06, "loss": 1.3384, "step": 31335 }, { "epoch": 0.86, "learning_rate": 1.0712580720359068e-06, "loss": 1.1934, "step": 31336 }, { "epoch": 0.86, "learning_rate": 1.0708598078878728e-06, "loss": 1.2144, "step": 31337 }, { "epoch": 0.86, "learning_rate": 1.0704616135972346e-06, "loss": 1.228, "step": 31338 }, { "epoch": 0.86, "learning_rate": 1.0700634891671037e-06, "loss": 1.3804, "step": 31339 }, { "epoch": 0.86, "learning_rate": 1.0696654346006009e-06, "loss": 1.2664, "step": 31340 }, { "epoch": 0.86, "learning_rate": 1.0692674499008327e-06, "loss": 1.1616, "step": 31341 }, { "epoch": 0.86, "learning_rate": 1.0688695350709178e-06, "loss": 1.2339, "step": 31342 }, { "epoch": 0.86, "learning_rate": 1.0684716901139658e-06, "loss": 1.3118, "step": 31343 }, { "epoch": 0.86, "learning_rate": 1.0680739150330943e-06, "loss": 1.1262, "step": 31344 }, { "epoch": 0.86, "learning_rate": 1.067676209831412e-06, "loss": 1.3579, "step": 31345 }, { "epoch": 0.86, "learning_rate": 1.0672785745120284e-06, "loss": 1.186, "step": 31346 }, { "epoch": 0.86, "learning_rate": 1.0668810090780602e-06, "loss": 1.3374, "step": 31347 }, { "epoch": 0.86, "learning_rate": 1.0664835135326123e-06, "loss": 1.0818, "step": 31348 }, { "epoch": 0.86, "learning_rate": 1.0660860878787983e-06, "loss": 1.2349, "step": 31349 }, { "epoch": 0.86, "learning_rate": 1.0656887321197228e-06, "loss": 1.0382, "step": 31350 }, { "epoch": 0.86, "learning_rate": 1.0652914462584995e-06, "loss": 1.1541, "step": 31351 }, { "epoch": 0.86, "learning_rate": 1.0648942302982346e-06, "loss": 1.1802, "step": 31352 }, { "epoch": 0.86, "learning_rate": 1.0644970842420354e-06, "loss": 1.3374, "step": 31353 }, { "epoch": 0.86, "learning_rate": 1.0641000080930075e-06, "loss": 1.0725, "step": 31354 }, { "epoch": 0.86, "learning_rate": 1.0637030018542616e-06, "loss": 1.0891, "step": 31355 }, { "epoch": 0.86, "learning_rate": 1.0633060655289006e-06, "loss": 1.4072, "step": 31356 }, { "epoch": 0.86, "learning_rate": 1.0629091991200314e-06, "loss": 1.1746, "step": 31357 }, { "epoch": 0.86, "learning_rate": 1.0625124026307555e-06, "loss": 1.2073, "step": 31358 }, { "epoch": 0.86, "learning_rate": 1.0621156760641827e-06, "loss": 1.3533, "step": 31359 }, { "epoch": 0.86, "learning_rate": 1.061719019423413e-06, "loss": 1.3252, "step": 31360 }, { "epoch": 0.86, "learning_rate": 1.061322432711549e-06, "loss": 1.1929, "step": 31361 }, { "epoch": 0.86, "learning_rate": 1.0609259159316964e-06, "loss": 1.1415, "step": 31362 }, { "epoch": 0.86, "learning_rate": 1.060529469086956e-06, "loss": 1.2148, "step": 31363 }, { "epoch": 0.86, "learning_rate": 1.060133092180431e-06, "loss": 1.0962, "step": 31364 }, { "epoch": 0.86, "learning_rate": 1.0597367852152174e-06, "loss": 1.6826, "step": 31365 }, { "epoch": 0.86, "learning_rate": 1.0593405481944208e-06, "loss": 1.0905, "step": 31366 }, { "epoch": 0.86, "learning_rate": 1.0589443811211408e-06, "loss": 1.177, "step": 31367 }, { "epoch": 0.86, "learning_rate": 1.058548283998475e-06, "loss": 1.3196, "step": 31368 }, { "epoch": 0.86, "learning_rate": 1.058152256829521e-06, "loss": 1.2412, "step": 31369 }, { "epoch": 0.86, "learning_rate": 1.0577562996173808e-06, "loss": 1.1008, "step": 31370 }, { "epoch": 0.86, "learning_rate": 1.0573604123651504e-06, "loss": 1.177, "step": 31371 }, { "epoch": 0.86, "learning_rate": 1.0569645950759278e-06, "loss": 1.3457, "step": 31372 }, { "epoch": 0.86, "learning_rate": 1.0565688477528058e-06, "loss": 1.3279, "step": 31373 }, { "epoch": 0.86, "learning_rate": 1.0561731703988865e-06, "loss": 1.1285, "step": 31374 }, { "epoch": 0.86, "learning_rate": 1.0557775630172618e-06, "loss": 1.1667, "step": 31375 }, { "epoch": 0.86, "learning_rate": 1.0553820256110259e-06, "loss": 1.2878, "step": 31376 }, { "epoch": 0.86, "learning_rate": 1.0549865581832774e-06, "loss": 1.3149, "step": 31377 }, { "epoch": 0.86, "learning_rate": 1.0545911607371052e-06, "loss": 1.238, "step": 31378 }, { "epoch": 0.86, "learning_rate": 1.0541958332756097e-06, "loss": 1.3093, "step": 31379 }, { "epoch": 0.86, "learning_rate": 1.0538005758018756e-06, "loss": 1.3689, "step": 31380 }, { "epoch": 0.86, "learning_rate": 1.0534053883189998e-06, "loss": 1.2029, "step": 31381 }, { "epoch": 0.86, "learning_rate": 1.0530102708300727e-06, "loss": 1.1853, "step": 31382 }, { "epoch": 0.86, "learning_rate": 1.0526152233381893e-06, "loss": 1.395, "step": 31383 }, { "epoch": 0.86, "learning_rate": 1.0522202458464336e-06, "loss": 1.2493, "step": 31384 }, { "epoch": 0.86, "learning_rate": 1.0518253383579003e-06, "loss": 1.2793, "step": 31385 }, { "epoch": 0.86, "learning_rate": 1.0514305008756765e-06, "loss": 1.2332, "step": 31386 }, { "epoch": 0.86, "learning_rate": 1.0510357334028564e-06, "loss": 1.1331, "step": 31387 }, { "epoch": 0.86, "learning_rate": 1.05064103594252e-06, "loss": 1.2698, "step": 31388 }, { "epoch": 0.86, "learning_rate": 1.0502464084977626e-06, "loss": 1.2058, "step": 31389 }, { "epoch": 0.86, "learning_rate": 1.049851851071667e-06, "loss": 1.2463, "step": 31390 }, { "epoch": 0.86, "learning_rate": 1.0494573636673234e-06, "loss": 1.1323, "step": 31391 }, { "epoch": 0.86, "learning_rate": 1.0490629462878166e-06, "loss": 1.3286, "step": 31392 }, { "epoch": 0.86, "learning_rate": 1.04866859893623e-06, "loss": 1.3074, "step": 31393 }, { "epoch": 0.86, "learning_rate": 1.0482743216156544e-06, "loss": 1.134, "step": 31394 }, { "epoch": 0.86, "learning_rate": 1.0478801143291695e-06, "loss": 1.1047, "step": 31395 }, { "epoch": 0.86, "learning_rate": 1.0474859770798618e-06, "loss": 1.2388, "step": 31396 }, { "epoch": 0.86, "learning_rate": 1.0470919098708122e-06, "loss": 1.3113, "step": 31397 }, { "epoch": 0.86, "learning_rate": 1.046697912705107e-06, "loss": 1.1968, "step": 31398 }, { "epoch": 0.86, "learning_rate": 1.046303985585827e-06, "loss": 1.2756, "step": 31399 }, { "epoch": 0.86, "learning_rate": 1.0459101285160556e-06, "loss": 1.2852, "step": 31400 }, { "epoch": 0.86, "learning_rate": 1.045516341498869e-06, "loss": 1.2739, "step": 31401 }, { "epoch": 0.86, "learning_rate": 1.0451226245373546e-06, "loss": 1.302, "step": 31402 }, { "epoch": 0.86, "learning_rate": 1.0447289776345904e-06, "loss": 1.043, "step": 31403 }, { "epoch": 0.86, "learning_rate": 1.0443354007936557e-06, "loss": 1.0723, "step": 31404 }, { "epoch": 0.86, "learning_rate": 1.0439418940176272e-06, "loss": 0.9069, "step": 31405 }, { "epoch": 0.86, "learning_rate": 1.0435484573095877e-06, "loss": 1.3853, "step": 31406 }, { "epoch": 0.86, "learning_rate": 1.043155090672614e-06, "loss": 1.3774, "step": 31407 }, { "epoch": 0.86, "learning_rate": 1.04276179410978e-06, "loss": 1.1362, "step": 31408 }, { "epoch": 0.86, "learning_rate": 1.042368567624169e-06, "loss": 1.3325, "step": 31409 }, { "epoch": 0.86, "learning_rate": 1.041975411218854e-06, "loss": 1.2336, "step": 31410 }, { "epoch": 0.86, "learning_rate": 1.0415823248969104e-06, "loss": 1.2065, "step": 31411 }, { "epoch": 0.86, "learning_rate": 1.0411893086614123e-06, "loss": 1.1453, "step": 31412 }, { "epoch": 0.86, "learning_rate": 1.0407963625154382e-06, "loss": 1.1794, "step": 31413 }, { "epoch": 0.86, "learning_rate": 1.0404034864620605e-06, "loss": 1.0474, "step": 31414 }, { "epoch": 0.86, "learning_rate": 1.040010680504353e-06, "loss": 1.1919, "step": 31415 }, { "epoch": 0.86, "learning_rate": 1.0396179446453868e-06, "loss": 1.3118, "step": 31416 }, { "epoch": 0.86, "learning_rate": 1.0392252788882385e-06, "loss": 1.0852, "step": 31417 }, { "epoch": 0.86, "learning_rate": 1.0388326832359774e-06, "loss": 1.5627, "step": 31418 }, { "epoch": 0.86, "learning_rate": 1.0384401576916758e-06, "loss": 1.2991, "step": 31419 }, { "epoch": 0.86, "learning_rate": 1.0380477022584023e-06, "loss": 1.3044, "step": 31420 }, { "epoch": 0.86, "learning_rate": 1.0376553169392312e-06, "loss": 1.3367, "step": 31421 }, { "epoch": 0.86, "learning_rate": 1.037263001737231e-06, "loss": 1.302, "step": 31422 }, { "epoch": 0.86, "learning_rate": 1.0368707566554682e-06, "loss": 1.1401, "step": 31423 }, { "epoch": 0.86, "learning_rate": 1.0364785816970159e-06, "loss": 1.2131, "step": 31424 }, { "epoch": 0.86, "learning_rate": 1.0360864768649381e-06, "loss": 1.3804, "step": 31425 }, { "epoch": 0.86, "learning_rate": 1.0356944421623083e-06, "loss": 1.3545, "step": 31426 }, { "epoch": 0.86, "learning_rate": 1.035302477592186e-06, "loss": 1.1147, "step": 31427 }, { "epoch": 0.86, "learning_rate": 1.0349105831576445e-06, "loss": 1.3752, "step": 31428 }, { "epoch": 0.86, "learning_rate": 1.0345187588617445e-06, "loss": 1.2598, "step": 31429 }, { "epoch": 0.86, "learning_rate": 1.0341270047075568e-06, "loss": 1.3125, "step": 31430 }, { "epoch": 0.86, "learning_rate": 1.0337353206981404e-06, "loss": 1.4031, "step": 31431 }, { "epoch": 0.86, "learning_rate": 1.0333437068365647e-06, "loss": 1.1621, "step": 31432 }, { "epoch": 0.86, "learning_rate": 1.0329521631258887e-06, "loss": 1.4131, "step": 31433 }, { "epoch": 0.86, "learning_rate": 1.0325606895691832e-06, "loss": 1.3547, "step": 31434 }, { "epoch": 0.86, "learning_rate": 1.0321692861695021e-06, "loss": 1.2253, "step": 31435 }, { "epoch": 0.86, "learning_rate": 1.0317779529299133e-06, "loss": 1.1777, "step": 31436 }, { "epoch": 0.86, "learning_rate": 1.031386689853474e-06, "loss": 1.282, "step": 31437 }, { "epoch": 0.86, "learning_rate": 1.03099549694325e-06, "loss": 1.1577, "step": 31438 }, { "epoch": 0.86, "learning_rate": 1.0306043742023008e-06, "loss": 1.1754, "step": 31439 }, { "epoch": 0.86, "learning_rate": 1.030213321633682e-06, "loss": 1.1404, "step": 31440 }, { "epoch": 0.86, "learning_rate": 1.0298223392404594e-06, "loss": 1.2302, "step": 31441 }, { "epoch": 0.86, "learning_rate": 1.0294314270256878e-06, "loss": 1.2664, "step": 31442 }, { "epoch": 0.86, "learning_rate": 1.0290405849924269e-06, "loss": 1.1682, "step": 31443 }, { "epoch": 0.86, "learning_rate": 1.0286498131437317e-06, "loss": 1.2629, "step": 31444 }, { "epoch": 0.86, "learning_rate": 1.0282591114826645e-06, "loss": 1.3481, "step": 31445 }, { "epoch": 0.86, "learning_rate": 1.0278684800122785e-06, "loss": 1.2278, "step": 31446 }, { "epoch": 0.86, "learning_rate": 1.027477918735631e-06, "loss": 1.1858, "step": 31447 }, { "epoch": 0.86, "learning_rate": 1.027087427655774e-06, "loss": 1.2732, "step": 31448 }, { "epoch": 0.86, "learning_rate": 1.0266970067757687e-06, "loss": 1.3469, "step": 31449 }, { "epoch": 0.86, "learning_rate": 1.0263066560986656e-06, "loss": 1.2024, "step": 31450 }, { "epoch": 0.86, "learning_rate": 1.0259163756275203e-06, "loss": 1.2542, "step": 31451 }, { "epoch": 0.86, "learning_rate": 1.0255261653653837e-06, "loss": 1.2795, "step": 31452 }, { "epoch": 0.86, "learning_rate": 1.0251360253153119e-06, "loss": 1.2439, "step": 31453 }, { "epoch": 0.86, "learning_rate": 1.0247459554803552e-06, "loss": 1.2466, "step": 31454 }, { "epoch": 0.86, "learning_rate": 1.0243559558635642e-06, "loss": 1.2585, "step": 31455 }, { "epoch": 0.86, "learning_rate": 1.023966026467993e-06, "loss": 1.2644, "step": 31456 }, { "epoch": 0.86, "learning_rate": 1.0235761672966903e-06, "loss": 1.4678, "step": 31457 }, { "epoch": 0.86, "learning_rate": 1.0231863783527074e-06, "loss": 1.2764, "step": 31458 }, { "epoch": 0.86, "learning_rate": 1.0227966596390915e-06, "loss": 1.2141, "step": 31459 }, { "epoch": 0.86, "learning_rate": 1.0224070111588946e-06, "loss": 1.249, "step": 31460 }, { "epoch": 0.86, "learning_rate": 1.0220174329151632e-06, "loss": 1.3218, "step": 31461 }, { "epoch": 0.86, "learning_rate": 1.0216279249109473e-06, "loss": 1.0767, "step": 31462 }, { "epoch": 0.86, "learning_rate": 1.0212384871492887e-06, "loss": 1.3428, "step": 31463 }, { "epoch": 0.86, "learning_rate": 1.0208491196332414e-06, "loss": 1.2542, "step": 31464 }, { "epoch": 0.86, "learning_rate": 1.0204598223658479e-06, "loss": 1.3892, "step": 31465 }, { "epoch": 0.86, "learning_rate": 1.0200705953501545e-06, "loss": 1.3521, "step": 31466 }, { "epoch": 0.86, "learning_rate": 1.0196814385892029e-06, "loss": 1.2556, "step": 31467 }, { "epoch": 0.86, "learning_rate": 1.019292352086042e-06, "loss": 1.2937, "step": 31468 }, { "epoch": 0.86, "learning_rate": 1.0189033358437183e-06, "loss": 1.1504, "step": 31469 }, { "epoch": 0.86, "learning_rate": 1.0185143898652684e-06, "loss": 1.1887, "step": 31470 }, { "epoch": 0.86, "learning_rate": 1.0181255141537393e-06, "loss": 1.0669, "step": 31471 }, { "epoch": 0.86, "learning_rate": 1.0177367087121715e-06, "loss": 1.2451, "step": 31472 }, { "epoch": 0.86, "learning_rate": 1.017347973543612e-06, "loss": 1.3438, "step": 31473 }, { "epoch": 0.86, "learning_rate": 1.0169593086510932e-06, "loss": 1.189, "step": 31474 }, { "epoch": 0.86, "learning_rate": 1.0165707140376635e-06, "loss": 1.1794, "step": 31475 }, { "epoch": 0.86, "learning_rate": 1.0161821897063583e-06, "loss": 1.1675, "step": 31476 }, { "epoch": 0.86, "learning_rate": 1.015793735660222e-06, "loss": 1.2993, "step": 31477 }, { "epoch": 0.86, "learning_rate": 1.0154053519022877e-06, "loss": 1.2627, "step": 31478 }, { "epoch": 0.86, "learning_rate": 1.0150170384355996e-06, "loss": 1.1453, "step": 31479 }, { "epoch": 0.86, "learning_rate": 1.0146287952631907e-06, "loss": 1.3494, "step": 31480 }, { "epoch": 0.86, "learning_rate": 1.014240622388104e-06, "loss": 1.2817, "step": 31481 }, { "epoch": 0.86, "learning_rate": 1.0138525198133708e-06, "loss": 1.126, "step": 31482 }, { "epoch": 0.86, "learning_rate": 1.0134644875420307e-06, "loss": 1.2612, "step": 31483 }, { "epoch": 0.86, "learning_rate": 1.013076525577117e-06, "loss": 1.3193, "step": 31484 }, { "epoch": 0.86, "learning_rate": 1.012688633921669e-06, "loss": 1.2686, "step": 31485 }, { "epoch": 0.86, "learning_rate": 1.0123008125787181e-06, "loss": 1.3174, "step": 31486 }, { "epoch": 0.86, "learning_rate": 1.0119130615512984e-06, "loss": 1.3535, "step": 31487 }, { "epoch": 0.86, "learning_rate": 1.0115253808424464e-06, "loss": 1.1682, "step": 31488 }, { "epoch": 0.86, "learning_rate": 1.0111377704551916e-06, "loss": 1.1909, "step": 31489 }, { "epoch": 0.86, "learning_rate": 1.0107502303925697e-06, "loss": 1.1321, "step": 31490 }, { "epoch": 0.86, "learning_rate": 1.0103627606576083e-06, "loss": 1.2905, "step": 31491 }, { "epoch": 0.86, "learning_rate": 1.0099753612533437e-06, "loss": 1.2517, "step": 31492 }, { "epoch": 0.86, "learning_rate": 1.0095880321828044e-06, "loss": 1.282, "step": 31493 }, { "epoch": 0.86, "learning_rate": 1.0092007734490206e-06, "loss": 1.3101, "step": 31494 }, { "epoch": 0.86, "learning_rate": 1.0088135850550197e-06, "loss": 1.2952, "step": 31495 }, { "epoch": 0.86, "learning_rate": 1.0084264670038357e-06, "loss": 1.3547, "step": 31496 }, { "epoch": 0.86, "learning_rate": 1.0080394192984956e-06, "loss": 1.1936, "step": 31497 }, { "epoch": 0.86, "learning_rate": 1.0076524419420252e-06, "loss": 1.4143, "step": 31498 }, { "epoch": 0.86, "learning_rate": 1.0072655349374526e-06, "loss": 1.3315, "step": 31499 }, { "epoch": 0.86, "learning_rate": 1.0068786982878087e-06, "loss": 1.3398, "step": 31500 }, { "epoch": 0.86, "learning_rate": 1.0064919319961153e-06, "loss": 1.281, "step": 31501 }, { "epoch": 0.86, "learning_rate": 1.006105236065399e-06, "loss": 1.2825, "step": 31502 }, { "epoch": 0.86, "learning_rate": 1.0057186104986882e-06, "loss": 1.155, "step": 31503 }, { "epoch": 0.86, "learning_rate": 1.0053320552990054e-06, "loss": 1.2844, "step": 31504 }, { "epoch": 0.86, "learning_rate": 1.0049455704693744e-06, "loss": 1.1091, "step": 31505 }, { "epoch": 0.86, "learning_rate": 1.0045591560128177e-06, "loss": 1.2151, "step": 31506 }, { "epoch": 0.86, "learning_rate": 1.0041728119323624e-06, "loss": 1.3557, "step": 31507 }, { "epoch": 0.86, "learning_rate": 1.0037865382310296e-06, "loss": 1.1616, "step": 31508 }, { "epoch": 0.86, "learning_rate": 1.0034003349118394e-06, "loss": 1.2861, "step": 31509 }, { "epoch": 0.86, "learning_rate": 1.0030142019778133e-06, "loss": 1.2412, "step": 31510 }, { "epoch": 0.86, "learning_rate": 1.0026281394319748e-06, "loss": 1.2439, "step": 31511 }, { "epoch": 0.86, "learning_rate": 1.0022421472773436e-06, "loss": 1.1868, "step": 31512 }, { "epoch": 0.86, "learning_rate": 1.0018562255169383e-06, "loss": 1.281, "step": 31513 }, { "epoch": 0.86, "learning_rate": 1.0014703741537769e-06, "loss": 1.3315, "step": 31514 }, { "epoch": 0.86, "learning_rate": 1.0010845931908797e-06, "loss": 1.2671, "step": 31515 }, { "epoch": 0.86, "learning_rate": 1.000698882631269e-06, "loss": 1.3298, "step": 31516 }, { "epoch": 0.86, "learning_rate": 1.000313242477955e-06, "loss": 1.2864, "step": 31517 }, { "epoch": 0.86, "learning_rate": 9.99927672733959e-07, "loss": 1.2754, "step": 31518 }, { "epoch": 0.86, "learning_rate": 9.995421734022959e-07, "loss": 1.2354, "step": 31519 }, { "epoch": 0.86, "learning_rate": 9.991567444859861e-07, "loss": 1.2439, "step": 31520 }, { "epoch": 0.86, "learning_rate": 9.987713859880376e-07, "loss": 1.2317, "step": 31521 }, { "epoch": 0.86, "learning_rate": 9.983860979114713e-07, "loss": 1.3137, "step": 31522 }, { "epoch": 0.86, "learning_rate": 9.980008802592967e-07, "loss": 1.1841, "step": 31523 }, { "epoch": 0.86, "learning_rate": 9.976157330345348e-07, "loss": 1.335, "step": 31524 }, { "epoch": 0.86, "learning_rate": 9.972306562401902e-07, "loss": 1.2097, "step": 31525 }, { "epoch": 0.86, "learning_rate": 9.968456498792812e-07, "loss": 1.4229, "step": 31526 }, { "epoch": 0.86, "learning_rate": 9.964607139548156e-07, "loss": 1.2646, "step": 31527 }, { "epoch": 0.86, "learning_rate": 9.960758484698118e-07, "loss": 1.1438, "step": 31528 }, { "epoch": 0.86, "learning_rate": 9.956910534272734e-07, "loss": 1.1069, "step": 31529 }, { "epoch": 0.86, "learning_rate": 9.953063288302146e-07, "loss": 1.1504, "step": 31530 }, { "epoch": 0.86, "learning_rate": 9.94921674681646e-07, "loss": 1.3247, "step": 31531 }, { "epoch": 0.86, "learning_rate": 9.945370909845753e-07, "loss": 1.3164, "step": 31532 }, { "epoch": 0.86, "learning_rate": 9.941525777420125e-07, "loss": 1.2322, "step": 31533 }, { "epoch": 0.86, "learning_rate": 9.937681349569627e-07, "loss": 1.155, "step": 31534 }, { "epoch": 0.86, "learning_rate": 9.933837626324372e-07, "loss": 1.3181, "step": 31535 }, { "epoch": 0.86, "learning_rate": 9.929994607714433e-07, "loss": 1.2336, "step": 31536 }, { "epoch": 0.86, "learning_rate": 9.926152293769853e-07, "loss": 1.1975, "step": 31537 }, { "epoch": 0.86, "learning_rate": 9.922310684520685e-07, "loss": 1.1946, "step": 31538 }, { "epoch": 0.86, "learning_rate": 9.91846977999702e-07, "loss": 1.1162, "step": 31539 }, { "epoch": 0.86, "learning_rate": 9.914629580228896e-07, "loss": 1.2817, "step": 31540 }, { "epoch": 0.86, "learning_rate": 9.910790085246336e-07, "loss": 1.2329, "step": 31541 }, { "epoch": 0.86, "learning_rate": 9.90695129507938e-07, "loss": 1.2834, "step": 31542 }, { "epoch": 0.86, "learning_rate": 9.903113209758098e-07, "loss": 1.1812, "step": 31543 }, { "epoch": 0.86, "learning_rate": 9.899275829312483e-07, "loss": 1.2803, "step": 31544 }, { "epoch": 0.86, "learning_rate": 9.895439153772557e-07, "loss": 1.3184, "step": 31545 }, { "epoch": 0.86, "learning_rate": 9.891603183168342e-07, "loss": 1.4023, "step": 31546 }, { "epoch": 0.86, "learning_rate": 9.887767917529866e-07, "loss": 1.1189, "step": 31547 }, { "epoch": 0.86, "learning_rate": 9.88393335688711e-07, "loss": 1.2715, "step": 31548 }, { "epoch": 0.86, "learning_rate": 9.88009950127008e-07, "loss": 1.3439, "step": 31549 }, { "epoch": 0.86, "learning_rate": 9.876266350708785e-07, "loss": 1.1392, "step": 31550 }, { "epoch": 0.86, "learning_rate": 9.872433905233204e-07, "loss": 1.333, "step": 31551 }, { "epoch": 0.86, "learning_rate": 9.86860216487332e-07, "loss": 1.1853, "step": 31552 }, { "epoch": 0.86, "learning_rate": 9.86477112965909e-07, "loss": 1.1394, "step": 31553 }, { "epoch": 0.86, "learning_rate": 9.860940799620522e-07, "loss": 1.3098, "step": 31554 }, { "epoch": 0.86, "learning_rate": 9.85711117478757e-07, "loss": 1.1899, "step": 31555 }, { "epoch": 0.86, "learning_rate": 9.85328225519019e-07, "loss": 1.1541, "step": 31556 }, { "epoch": 0.86, "learning_rate": 9.84945404085832e-07, "loss": 1.2344, "step": 31557 }, { "epoch": 0.86, "learning_rate": 9.84562653182195e-07, "loss": 1.3201, "step": 31558 }, { "epoch": 0.86, "learning_rate": 9.841799728111012e-07, "loss": 1.1624, "step": 31559 }, { "epoch": 0.86, "learning_rate": 9.837973629755426e-07, "loss": 1.2935, "step": 31560 }, { "epoch": 0.86, "learning_rate": 9.834148236785124e-07, "loss": 1.3105, "step": 31561 }, { "epoch": 0.86, "learning_rate": 9.830323549230048e-07, "loss": 1.3145, "step": 31562 }, { "epoch": 0.86, "learning_rate": 9.826499567120162e-07, "loss": 1.1433, "step": 31563 }, { "epoch": 0.86, "learning_rate": 9.82267629048529e-07, "loss": 1.1519, "step": 31564 }, { "epoch": 0.86, "learning_rate": 9.818853719355427e-07, "loss": 1.2102, "step": 31565 }, { "epoch": 0.86, "learning_rate": 9.815031853760414e-07, "loss": 1.21, "step": 31566 }, { "epoch": 0.86, "learning_rate": 9.811210693730211e-07, "loss": 1.2786, "step": 31567 }, { "epoch": 0.86, "learning_rate": 9.80739023929469e-07, "loss": 1.3428, "step": 31568 }, { "epoch": 0.86, "learning_rate": 9.803570490483727e-07, "loss": 1.2185, "step": 31569 }, { "epoch": 0.86, "learning_rate": 9.7997514473272e-07, "loss": 1.1477, "step": 31570 }, { "epoch": 0.86, "learning_rate": 9.795933109855027e-07, "loss": 1.0892, "step": 31571 }, { "epoch": 0.86, "learning_rate": 9.792115478097052e-07, "loss": 1.2573, "step": 31572 }, { "epoch": 0.86, "learning_rate": 9.788298552083142e-07, "loss": 1.3533, "step": 31573 }, { "epoch": 0.86, "learning_rate": 9.784482331843148e-07, "loss": 1.3142, "step": 31574 }, { "epoch": 0.86, "learning_rate": 9.78066681740696e-07, "loss": 1.2849, "step": 31575 }, { "epoch": 0.86, "learning_rate": 9.776852008804417e-07, "loss": 1.2893, "step": 31576 }, { "epoch": 0.86, "learning_rate": 9.773037906065331e-07, "loss": 1.1919, "step": 31577 }, { "epoch": 0.86, "learning_rate": 9.769224509219588e-07, "loss": 1.2795, "step": 31578 }, { "epoch": 0.86, "learning_rate": 9.76541181829701e-07, "loss": 1.3589, "step": 31579 }, { "epoch": 0.86, "learning_rate": 9.761599833327407e-07, "loss": 1.0649, "step": 31580 }, { "epoch": 0.86, "learning_rate": 9.757788554340609e-07, "loss": 1.335, "step": 31581 }, { "epoch": 0.86, "learning_rate": 9.753977981366447e-07, "loss": 1.3301, "step": 31582 }, { "epoch": 0.86, "learning_rate": 9.750168114434733e-07, "loss": 1.0811, "step": 31583 }, { "epoch": 0.86, "learning_rate": 9.746358953575252e-07, "loss": 1.3477, "step": 31584 }, { "epoch": 0.86, "learning_rate": 9.742550498817814e-07, "loss": 1.2471, "step": 31585 }, { "epoch": 0.86, "learning_rate": 9.73874275019223e-07, "loss": 1.2725, "step": 31586 }, { "epoch": 0.86, "learning_rate": 9.734935707728276e-07, "loss": 1.3193, "step": 31587 }, { "epoch": 0.86, "learning_rate": 9.73112937145575e-07, "loss": 1.1907, "step": 31588 }, { "epoch": 0.86, "learning_rate": 9.727323741404393e-07, "loss": 1.2595, "step": 31589 }, { "epoch": 0.86, "learning_rate": 9.723518817604027e-07, "loss": 1.23, "step": 31590 }, { "epoch": 0.86, "learning_rate": 9.719714600084396e-07, "loss": 1.2058, "step": 31591 }, { "epoch": 0.86, "learning_rate": 9.715911088875252e-07, "loss": 1.2134, "step": 31592 }, { "epoch": 0.86, "learning_rate": 9.712108284006383e-07, "loss": 1.175, "step": 31593 }, { "epoch": 0.86, "learning_rate": 9.70830618550752e-07, "loss": 1.2322, "step": 31594 }, { "epoch": 0.86, "learning_rate": 9.704504793408409e-07, "loss": 1.2554, "step": 31595 }, { "epoch": 0.86, "learning_rate": 9.70070410773878e-07, "loss": 1.2363, "step": 31596 }, { "epoch": 0.86, "learning_rate": 9.696904128528395e-07, "loss": 1.3594, "step": 31597 }, { "epoch": 0.86, "learning_rate": 9.693104855806968e-07, "loss": 1.3303, "step": 31598 }, { "epoch": 0.86, "learning_rate": 9.689306289604228e-07, "loss": 1.2288, "step": 31599 }, { "epoch": 0.86, "learning_rate": 9.685508429949864e-07, "loss": 1.2854, "step": 31600 }, { "epoch": 0.86, "learning_rate": 9.681711276873629e-07, "loss": 1.2725, "step": 31601 }, { "epoch": 0.86, "learning_rate": 9.67791483040521e-07, "loss": 1.1221, "step": 31602 }, { "epoch": 0.86, "learning_rate": 9.67411909057434e-07, "loss": 1.2729, "step": 31603 }, { "epoch": 0.86, "learning_rate": 9.670324057410652e-07, "loss": 1.2471, "step": 31604 }, { "epoch": 0.86, "learning_rate": 9.666529730943885e-07, "loss": 1.2708, "step": 31605 }, { "epoch": 0.86, "learning_rate": 9.662736111203696e-07, "loss": 1.1936, "step": 31606 }, { "epoch": 0.86, "learning_rate": 9.658943198219828e-07, "loss": 1.366, "step": 31607 }, { "epoch": 0.86, "learning_rate": 9.655150992021856e-07, "loss": 1.2593, "step": 31608 }, { "epoch": 0.86, "learning_rate": 9.65135949263951e-07, "loss": 1.0767, "step": 31609 }, { "epoch": 0.86, "learning_rate": 9.64756870010246e-07, "loss": 1.157, "step": 31610 }, { "epoch": 0.86, "learning_rate": 9.643778614440336e-07, "loss": 1.0385, "step": 31611 }, { "epoch": 0.86, "learning_rate": 9.639989235682812e-07, "loss": 1.3381, "step": 31612 }, { "epoch": 0.86, "learning_rate": 9.636200563859498e-07, "loss": 1.1792, "step": 31613 }, { "epoch": 0.86, "learning_rate": 9.632412599000074e-07, "loss": 1.3243, "step": 31614 }, { "epoch": 0.86, "learning_rate": 9.628625341134168e-07, "loss": 1.3779, "step": 31615 }, { "epoch": 0.86, "learning_rate": 9.624838790291392e-07, "loss": 1.2395, "step": 31616 }, { "epoch": 0.86, "learning_rate": 9.621052946501363e-07, "loss": 1.3928, "step": 31617 }, { "epoch": 0.86, "learning_rate": 9.61726780979374e-07, "loss": 1.1628, "step": 31618 }, { "epoch": 0.86, "learning_rate": 9.613483380198109e-07, "loss": 1.1848, "step": 31619 }, { "epoch": 0.86, "learning_rate": 9.609699657744088e-07, "loss": 1.1235, "step": 31620 }, { "epoch": 0.86, "learning_rate": 9.605916642461245e-07, "loss": 1.2029, "step": 31621 }, { "epoch": 0.86, "learning_rate": 9.60213433437923e-07, "loss": 1.1296, "step": 31622 }, { "epoch": 0.86, "learning_rate": 9.598352733527605e-07, "loss": 1.2773, "step": 31623 }, { "epoch": 0.86, "learning_rate": 9.59457183993594e-07, "loss": 1.2664, "step": 31624 }, { "epoch": 0.86, "learning_rate": 9.590791653633847e-07, "loss": 1.094, "step": 31625 }, { "epoch": 0.86, "learning_rate": 9.58701217465089e-07, "loss": 1.3188, "step": 31626 }, { "epoch": 0.86, "learning_rate": 9.583233403016633e-07, "loss": 1.3718, "step": 31627 }, { "epoch": 0.86, "learning_rate": 9.579455338760623e-07, "loss": 1.2339, "step": 31628 }, { "epoch": 0.86, "learning_rate": 9.575677981912457e-07, "loss": 1.2278, "step": 31629 }, { "epoch": 0.86, "learning_rate": 9.571901332501665e-07, "loss": 1.1034, "step": 31630 }, { "epoch": 0.86, "learning_rate": 9.568125390557802e-07, "loss": 1.1992, "step": 31631 }, { "epoch": 0.86, "learning_rate": 9.56435015611037e-07, "loss": 1.251, "step": 31632 }, { "epoch": 0.86, "learning_rate": 9.560575629188961e-07, "loss": 1.3042, "step": 31633 }, { "epoch": 0.86, "learning_rate": 9.55680180982308e-07, "loss": 1.1179, "step": 31634 }, { "epoch": 0.86, "learning_rate": 9.553028698042255e-07, "loss": 1.302, "step": 31635 }, { "epoch": 0.86, "learning_rate": 9.549256293875985e-07, "loss": 1.1526, "step": 31636 }, { "epoch": 0.86, "learning_rate": 9.545484597353816e-07, "loss": 1.3201, "step": 31637 }, { "epoch": 0.86, "learning_rate": 9.541713608505244e-07, "loss": 1.4131, "step": 31638 }, { "epoch": 0.86, "learning_rate": 9.537943327359745e-07, "loss": 1.2278, "step": 31639 }, { "epoch": 0.86, "learning_rate": 9.534173753946851e-07, "loss": 1.3799, "step": 31640 }, { "epoch": 0.86, "learning_rate": 9.530404888296041e-07, "loss": 1.6895, "step": 31641 }, { "epoch": 0.86, "learning_rate": 9.526636730436823e-07, "loss": 1.197, "step": 31642 }, { "epoch": 0.86, "learning_rate": 9.522869280398627e-07, "loss": 1.1855, "step": 31643 }, { "epoch": 0.86, "learning_rate": 9.519102538210967e-07, "loss": 1.2756, "step": 31644 }, { "epoch": 0.86, "learning_rate": 9.515336503903294e-07, "loss": 1.2625, "step": 31645 }, { "epoch": 0.86, "learning_rate": 9.511571177505108e-07, "loss": 1.2656, "step": 31646 }, { "epoch": 0.86, "learning_rate": 9.507806559045807e-07, "loss": 1.283, "step": 31647 }, { "epoch": 0.86, "learning_rate": 9.504042648554889e-07, "loss": 1.1277, "step": 31648 }, { "epoch": 0.86, "learning_rate": 9.500279446061766e-07, "loss": 1.1531, "step": 31649 }, { "epoch": 0.86, "learning_rate": 9.496516951595947e-07, "loss": 1.2019, "step": 31650 }, { "epoch": 0.86, "learning_rate": 9.492755165186773e-07, "loss": 1.2466, "step": 31651 }, { "epoch": 0.86, "learning_rate": 9.488994086863757e-07, "loss": 1.4146, "step": 31652 }, { "epoch": 0.86, "learning_rate": 9.485233716656261e-07, "loss": 1.2734, "step": 31653 }, { "epoch": 0.86, "learning_rate": 9.481474054593754e-07, "loss": 1.3315, "step": 31654 }, { "epoch": 0.86, "learning_rate": 9.47771510070562e-07, "loss": 1.2368, "step": 31655 }, { "epoch": 0.86, "learning_rate": 9.473956855021271e-07, "loss": 1.2295, "step": 31656 }, { "epoch": 0.86, "learning_rate": 9.470199317570128e-07, "loss": 1.3042, "step": 31657 }, { "epoch": 0.86, "learning_rate": 9.466442488381578e-07, "loss": 1.2642, "step": 31658 }, { "epoch": 0.86, "learning_rate": 9.462686367485008e-07, "loss": 1.2844, "step": 31659 }, { "epoch": 0.86, "learning_rate": 9.458930954909795e-07, "loss": 1.2803, "step": 31660 }, { "epoch": 0.86, "learning_rate": 9.455176250685338e-07, "loss": 1.0903, "step": 31661 }, { "epoch": 0.86, "learning_rate": 9.451422254841014e-07, "loss": 1.342, "step": 31662 }, { "epoch": 0.86, "learning_rate": 9.447668967406176e-07, "loss": 1.3896, "step": 31663 }, { "epoch": 0.86, "learning_rate": 9.443916388410179e-07, "loss": 1.1801, "step": 31664 }, { "epoch": 0.86, "learning_rate": 9.440164517882422e-07, "loss": 1.1938, "step": 31665 }, { "epoch": 0.86, "learning_rate": 9.436413355852226e-07, "loss": 1.1768, "step": 31666 }, { "epoch": 0.86, "learning_rate": 9.432662902348944e-07, "loss": 1.3538, "step": 31667 }, { "epoch": 0.86, "learning_rate": 9.428913157401909e-07, "loss": 1.2693, "step": 31668 }, { "epoch": 0.86, "learning_rate": 9.425164121040487e-07, "loss": 1.3198, "step": 31669 }, { "epoch": 0.86, "learning_rate": 9.421415793293986e-07, "loss": 1.2729, "step": 31670 }, { "epoch": 0.86, "learning_rate": 9.417668174191707e-07, "loss": 1.2827, "step": 31671 }, { "epoch": 0.86, "learning_rate": 9.413921263763027e-07, "loss": 1.1785, "step": 31672 }, { "epoch": 0.86, "learning_rate": 9.41017506203723e-07, "loss": 1.6953, "step": 31673 }, { "epoch": 0.86, "learning_rate": 9.406429569043629e-07, "loss": 1.1809, "step": 31674 }, { "epoch": 0.87, "learning_rate": 9.4026847848115e-07, "loss": 1.1672, "step": 31675 }, { "epoch": 0.87, "learning_rate": 9.398940709370175e-07, "loss": 1.353, "step": 31676 }, { "epoch": 0.87, "learning_rate": 9.39519734274894e-07, "loss": 1.2986, "step": 31677 }, { "epoch": 0.87, "learning_rate": 9.391454684977075e-07, "loss": 1.1953, "step": 31678 }, { "epoch": 0.87, "learning_rate": 9.387712736083843e-07, "loss": 1.1895, "step": 31679 }, { "epoch": 0.87, "learning_rate": 9.383971496098565e-07, "loss": 1.3071, "step": 31680 }, { "epoch": 0.87, "learning_rate": 9.380230965050474e-07, "loss": 1.3738, "step": 31681 }, { "epoch": 0.87, "learning_rate": 9.376491142968846e-07, "loss": 1.2998, "step": 31682 }, { "epoch": 0.87, "learning_rate": 9.372752029882914e-07, "loss": 1.2759, "step": 31683 }, { "epoch": 0.87, "learning_rate": 9.369013625821977e-07, "loss": 1.3025, "step": 31684 }, { "epoch": 0.87, "learning_rate": 9.365275930815254e-07, "loss": 1.2432, "step": 31685 }, { "epoch": 0.87, "learning_rate": 9.361538944891979e-07, "loss": 1.1479, "step": 31686 }, { "epoch": 0.87, "learning_rate": 9.357802668081428e-07, "loss": 1.3335, "step": 31687 }, { "epoch": 0.87, "learning_rate": 9.354067100412778e-07, "loss": 1.1899, "step": 31688 }, { "epoch": 0.87, "learning_rate": 9.350332241915316e-07, "loss": 1.2976, "step": 31689 }, { "epoch": 0.87, "learning_rate": 9.346598092618197e-07, "loss": 1.1611, "step": 31690 }, { "epoch": 0.87, "learning_rate": 9.342864652550688e-07, "loss": 1.2993, "step": 31691 }, { "epoch": 0.87, "learning_rate": 9.33913192174195e-07, "loss": 1.1775, "step": 31692 }, { "epoch": 0.87, "learning_rate": 9.335399900221254e-07, "loss": 1.2424, "step": 31693 }, { "epoch": 0.87, "learning_rate": 9.331668588017717e-07, "loss": 1.2969, "step": 31694 }, { "epoch": 0.87, "learning_rate": 9.327937985160595e-07, "loss": 1.4009, "step": 31695 }, { "epoch": 0.87, "learning_rate": 9.324208091679021e-07, "loss": 1.1995, "step": 31696 }, { "epoch": 0.87, "learning_rate": 9.320478907602249e-07, "loss": 1.1646, "step": 31697 }, { "epoch": 0.87, "learning_rate": 9.316750432959365e-07, "loss": 1.3069, "step": 31698 }, { "epoch": 0.87, "learning_rate": 9.313022667779603e-07, "loss": 0.9316, "step": 31699 }, { "epoch": 0.87, "learning_rate": 9.309295612092095e-07, "loss": 1.3125, "step": 31700 }, { "epoch": 0.87, "learning_rate": 9.305569265926018e-07, "loss": 1.1863, "step": 31701 }, { "epoch": 0.87, "learning_rate": 9.301843629310537e-07, "loss": 1.2278, "step": 31702 }, { "epoch": 0.87, "learning_rate": 9.29811870227475e-07, "loss": 1.3467, "step": 31703 }, { "epoch": 0.87, "learning_rate": 9.294394484847858e-07, "loss": 1.2593, "step": 31704 }, { "epoch": 0.87, "learning_rate": 9.290670977058968e-07, "loss": 1.2085, "step": 31705 }, { "epoch": 0.87, "learning_rate": 9.286948178937217e-07, "loss": 1.1887, "step": 31706 }, { "epoch": 0.87, "learning_rate": 9.283226090511699e-07, "loss": 1.2629, "step": 31707 }, { "epoch": 0.87, "learning_rate": 9.279504711811582e-07, "loss": 1.2952, "step": 31708 }, { "epoch": 0.87, "learning_rate": 9.275784042865965e-07, "loss": 1.2637, "step": 31709 }, { "epoch": 0.87, "learning_rate": 9.272064083703958e-07, "loss": 1.3279, "step": 31710 }, { "epoch": 0.87, "learning_rate": 9.268344834354637e-07, "loss": 1.355, "step": 31711 }, { "epoch": 0.87, "learning_rate": 9.264626294847134e-07, "loss": 1.0991, "step": 31712 }, { "epoch": 0.87, "learning_rate": 9.260908465210528e-07, "loss": 1.3435, "step": 31713 }, { "epoch": 0.87, "learning_rate": 9.257191345473904e-07, "loss": 1.0969, "step": 31714 }, { "epoch": 0.87, "learning_rate": 9.25347493566634e-07, "loss": 1.2844, "step": 31715 }, { "epoch": 0.87, "learning_rate": 9.249759235816924e-07, "loss": 1.3877, "step": 31716 }, { "epoch": 0.87, "learning_rate": 9.246044245954711e-07, "loss": 1.2861, "step": 31717 }, { "epoch": 0.87, "learning_rate": 9.242329966108765e-07, "loss": 1.3367, "step": 31718 }, { "epoch": 0.87, "learning_rate": 9.238616396308164e-07, "loss": 1.2839, "step": 31719 }, { "epoch": 0.87, "learning_rate": 9.234903536581952e-07, "loss": 1.2422, "step": 31720 }, { "epoch": 0.87, "learning_rate": 9.231191386959182e-07, "loss": 1.2771, "step": 31721 }, { "epoch": 0.87, "learning_rate": 9.227479947468854e-07, "loss": 1.1926, "step": 31722 }, { "epoch": 0.87, "learning_rate": 9.223769218140066e-07, "loss": 1.2117, "step": 31723 }, { "epoch": 0.87, "learning_rate": 9.22005919900183e-07, "loss": 1.2803, "step": 31724 }, { "epoch": 0.87, "learning_rate": 9.216349890083154e-07, "loss": 1.2983, "step": 31725 }, { "epoch": 0.87, "learning_rate": 9.212641291413038e-07, "loss": 1.3564, "step": 31726 }, { "epoch": 0.87, "learning_rate": 9.208933403020559e-07, "loss": 1.3667, "step": 31727 }, { "epoch": 0.87, "learning_rate": 9.205226224934693e-07, "loss": 1.0579, "step": 31728 }, { "epoch": 0.87, "learning_rate": 9.201519757184429e-07, "loss": 1.3286, "step": 31729 }, { "epoch": 0.87, "learning_rate": 9.197813999798766e-07, "loss": 1.156, "step": 31730 }, { "epoch": 0.87, "learning_rate": 9.194108952806735e-07, "loss": 1.7065, "step": 31731 }, { "epoch": 0.87, "learning_rate": 9.190404616237281e-07, "loss": 1.2241, "step": 31732 }, { "epoch": 0.87, "learning_rate": 9.186700990119391e-07, "loss": 1.2703, "step": 31733 }, { "epoch": 0.87, "learning_rate": 9.182998074482063e-07, "loss": 1.2654, "step": 31734 }, { "epoch": 0.87, "learning_rate": 9.179295869354243e-07, "loss": 1.2136, "step": 31735 }, { "epoch": 0.87, "learning_rate": 9.175594374764929e-07, "loss": 1.3123, "step": 31736 }, { "epoch": 0.87, "learning_rate": 9.17189359074303e-07, "loss": 1.3135, "step": 31737 }, { "epoch": 0.87, "learning_rate": 9.168193517317536e-07, "loss": 1.3267, "step": 31738 }, { "epoch": 0.87, "learning_rate": 9.164494154517367e-07, "loss": 1.3396, "step": 31739 }, { "epoch": 0.87, "learning_rate": 9.160795502371522e-07, "loss": 1.2271, "step": 31740 }, { "epoch": 0.87, "learning_rate": 9.157097560908867e-07, "loss": 1.3127, "step": 31741 }, { "epoch": 0.87, "learning_rate": 9.153400330158369e-07, "loss": 1.2263, "step": 31742 }, { "epoch": 0.87, "learning_rate": 9.149703810148935e-07, "loss": 1.2327, "step": 31743 }, { "epoch": 0.87, "learning_rate": 9.146008000909534e-07, "loss": 1.2688, "step": 31744 }, { "epoch": 0.87, "learning_rate": 9.142312902469009e-07, "loss": 1.3933, "step": 31745 }, { "epoch": 0.87, "learning_rate": 9.138618514856312e-07, "loss": 1.3145, "step": 31746 }, { "epoch": 0.87, "learning_rate": 9.134924838100335e-07, "loss": 0.9988, "step": 31747 }, { "epoch": 0.87, "learning_rate": 9.131231872229984e-07, "loss": 1.2158, "step": 31748 }, { "epoch": 0.87, "learning_rate": 9.12753961727415e-07, "loss": 1.2024, "step": 31749 }, { "epoch": 0.87, "learning_rate": 9.123848073261698e-07, "loss": 1.2456, "step": 31750 }, { "epoch": 0.87, "learning_rate": 9.120157240221539e-07, "loss": 1.1511, "step": 31751 }, { "epoch": 0.87, "learning_rate": 9.116467118182538e-07, "loss": 1.1144, "step": 31752 }, { "epoch": 0.87, "learning_rate": 9.112777707173559e-07, "loss": 1.2292, "step": 31753 }, { "epoch": 0.87, "learning_rate": 9.109089007223459e-07, "loss": 1.3364, "step": 31754 }, { "epoch": 0.87, "learning_rate": 9.105401018361115e-07, "loss": 1.2964, "step": 31755 }, { "epoch": 0.87, "learning_rate": 9.101713740615381e-07, "loss": 1.1357, "step": 31756 }, { "epoch": 0.87, "learning_rate": 9.098027174015089e-07, "loss": 1.6758, "step": 31757 }, { "epoch": 0.87, "learning_rate": 9.094341318589073e-07, "loss": 1.1943, "step": 31758 }, { "epoch": 0.87, "learning_rate": 9.090656174366197e-07, "loss": 1.3765, "step": 31759 }, { "epoch": 0.87, "learning_rate": 9.086971741375283e-07, "loss": 1.3447, "step": 31760 }, { "epoch": 0.87, "learning_rate": 9.083288019645154e-07, "loss": 1.2771, "step": 31761 }, { "epoch": 0.87, "learning_rate": 9.079605009204606e-07, "loss": 1.2192, "step": 31762 }, { "epoch": 0.87, "learning_rate": 9.075922710082485e-07, "loss": 1.3467, "step": 31763 }, { "epoch": 0.87, "learning_rate": 9.072241122307601e-07, "loss": 1.2451, "step": 31764 }, { "epoch": 0.87, "learning_rate": 9.06856024590872e-07, "loss": 1.4092, "step": 31765 }, { "epoch": 0.87, "learning_rate": 9.064880080914684e-07, "loss": 1.3369, "step": 31766 }, { "epoch": 0.87, "learning_rate": 9.061200627354272e-07, "loss": 1.282, "step": 31767 }, { "epoch": 0.87, "learning_rate": 9.057521885256259e-07, "loss": 1.2407, "step": 31768 }, { "epoch": 0.87, "learning_rate": 9.053843854649413e-07, "loss": 1.1907, "step": 31769 }, { "epoch": 0.87, "learning_rate": 9.050166535562543e-07, "loss": 1.1699, "step": 31770 }, { "epoch": 0.87, "learning_rate": 9.046489928024404e-07, "loss": 1.3535, "step": 31771 }, { "epoch": 0.87, "learning_rate": 9.042814032063762e-07, "loss": 1.2297, "step": 31772 }, { "epoch": 0.87, "learning_rate": 9.03913884770935e-07, "loss": 1.3237, "step": 31773 }, { "epoch": 0.87, "learning_rate": 9.035464374989955e-07, "loss": 1.2073, "step": 31774 }, { "epoch": 0.87, "learning_rate": 9.031790613934321e-07, "loss": 1.1709, "step": 31775 }, { "epoch": 0.87, "learning_rate": 9.028117564571182e-07, "loss": 1.3137, "step": 31776 }, { "epoch": 0.87, "learning_rate": 9.024445226929246e-07, "loss": 1.3357, "step": 31777 }, { "epoch": 0.87, "learning_rate": 9.02077360103728e-07, "loss": 1.2998, "step": 31778 }, { "epoch": 0.87, "learning_rate": 9.017102686924028e-07, "loss": 1.1677, "step": 31779 }, { "epoch": 0.87, "learning_rate": 9.013432484618146e-07, "loss": 1.4028, "step": 31780 }, { "epoch": 0.87, "learning_rate": 9.009762994148408e-07, "loss": 1.1943, "step": 31781 }, { "epoch": 0.87, "learning_rate": 9.006094215543482e-07, "loss": 1.3887, "step": 31782 }, { "epoch": 0.87, "learning_rate": 9.002426148832111e-07, "loss": 1.2554, "step": 31783 }, { "epoch": 0.87, "learning_rate": 8.998758794042939e-07, "loss": 1.2126, "step": 31784 }, { "epoch": 0.87, "learning_rate": 8.995092151204699e-07, "loss": 1.1895, "step": 31785 }, { "epoch": 0.87, "learning_rate": 8.991426220346056e-07, "loss": 1.7349, "step": 31786 }, { "epoch": 0.87, "learning_rate": 8.987761001495732e-07, "loss": 1.2092, "step": 31787 }, { "epoch": 0.87, "learning_rate": 8.984096494682326e-07, "loss": 1.3484, "step": 31788 }, { "epoch": 0.87, "learning_rate": 8.980432699934572e-07, "loss": 1.2354, "step": 31789 }, { "epoch": 0.87, "learning_rate": 8.9767696172811e-07, "loss": 1.2969, "step": 31790 }, { "epoch": 0.87, "learning_rate": 8.973107246750612e-07, "loss": 1.2598, "step": 31791 }, { "epoch": 0.87, "learning_rate": 8.969445588371684e-07, "loss": 1.2075, "step": 31792 }, { "epoch": 0.87, "learning_rate": 8.965784642173037e-07, "loss": 1.2073, "step": 31793 }, { "epoch": 0.87, "learning_rate": 8.96212440818327e-07, "loss": 1.1023, "step": 31794 }, { "epoch": 0.87, "learning_rate": 8.95846488643104e-07, "loss": 1.2881, "step": 31795 }, { "epoch": 0.87, "learning_rate": 8.954806076944978e-07, "loss": 1.2852, "step": 31796 }, { "epoch": 0.87, "learning_rate": 8.951147979753671e-07, "loss": 1.0377, "step": 31797 }, { "epoch": 0.87, "learning_rate": 8.947490594885799e-07, "loss": 1.2705, "step": 31798 }, { "epoch": 0.87, "learning_rate": 8.943833922369937e-07, "loss": 1.2889, "step": 31799 }, { "epoch": 0.87, "learning_rate": 8.940177962234708e-07, "loss": 1.3215, "step": 31800 }, { "epoch": 0.87, "learning_rate": 8.936522714508678e-07, "loss": 1.3564, "step": 31801 }, { "epoch": 0.87, "learning_rate": 8.932868179220499e-07, "loss": 1.27, "step": 31802 }, { "epoch": 0.87, "learning_rate": 8.929214356398741e-07, "loss": 1.1385, "step": 31803 }, { "epoch": 0.87, "learning_rate": 8.925561246071979e-07, "loss": 1.2478, "step": 31804 }, { "epoch": 0.87, "learning_rate": 8.921908848268779e-07, "loss": 1.2581, "step": 31805 }, { "epoch": 0.87, "learning_rate": 8.918257163017752e-07, "loss": 1.3457, "step": 31806 }, { "epoch": 0.87, "learning_rate": 8.914606190347464e-07, "loss": 1.313, "step": 31807 }, { "epoch": 0.87, "learning_rate": 8.910955930286458e-07, "loss": 1.178, "step": 31808 }, { "epoch": 0.87, "learning_rate": 8.907306382863279e-07, "loss": 1.3433, "step": 31809 }, { "epoch": 0.87, "learning_rate": 8.903657548106526e-07, "loss": 1.2002, "step": 31810 }, { "epoch": 0.87, "learning_rate": 8.900009426044709e-07, "loss": 1.2451, "step": 31811 }, { "epoch": 0.87, "learning_rate": 8.896362016706372e-07, "loss": 1.093, "step": 31812 }, { "epoch": 0.87, "learning_rate": 8.892715320120071e-07, "loss": 1.2009, "step": 31813 }, { "epoch": 0.87, "learning_rate": 8.889069336314327e-07, "loss": 1.2061, "step": 31814 }, { "epoch": 0.87, "learning_rate": 8.88542406531766e-07, "loss": 1.2996, "step": 31815 }, { "epoch": 0.87, "learning_rate": 8.881779507158572e-07, "loss": 1.1748, "step": 31816 }, { "epoch": 0.87, "learning_rate": 8.878135661865606e-07, "loss": 0.9546, "step": 31817 }, { "epoch": 0.87, "learning_rate": 8.874492529467271e-07, "loss": 1.2695, "step": 31818 }, { "epoch": 0.87, "learning_rate": 8.870850109992046e-07, "loss": 1.239, "step": 31819 }, { "epoch": 0.87, "learning_rate": 8.867208403468419e-07, "loss": 1.3284, "step": 31820 }, { "epoch": 0.87, "learning_rate": 8.863567409924922e-07, "loss": 1.2117, "step": 31821 }, { "epoch": 0.87, "learning_rate": 8.859927129390022e-07, "loss": 1.1436, "step": 31822 }, { "epoch": 0.87, "learning_rate": 8.856287561892196e-07, "loss": 1.1663, "step": 31823 }, { "epoch": 0.87, "learning_rate": 8.852648707459888e-07, "loss": 1.312, "step": 31824 }, { "epoch": 0.87, "learning_rate": 8.849010566121608e-07, "loss": 1.3936, "step": 31825 }, { "epoch": 0.87, "learning_rate": 8.845373137905833e-07, "loss": 1.2856, "step": 31826 }, { "epoch": 0.87, "learning_rate": 8.841736422840963e-07, "loss": 1.3618, "step": 31827 }, { "epoch": 0.87, "learning_rate": 8.838100420955498e-07, "loss": 1.6851, "step": 31828 }, { "epoch": 0.87, "learning_rate": 8.834465132277858e-07, "loss": 1.3435, "step": 31829 }, { "epoch": 0.87, "learning_rate": 8.830830556836523e-07, "loss": 1.3455, "step": 31830 }, { "epoch": 0.87, "learning_rate": 8.827196694659867e-07, "loss": 1.3896, "step": 31831 }, { "epoch": 0.87, "learning_rate": 8.823563545776359e-07, "loss": 1.2305, "step": 31832 }, { "epoch": 0.87, "learning_rate": 8.819931110214408e-07, "loss": 1.2415, "step": 31833 }, { "epoch": 0.87, "learning_rate": 8.816299388002458e-07, "loss": 1.2563, "step": 31834 }, { "epoch": 0.87, "learning_rate": 8.812668379168898e-07, "loss": 1.1389, "step": 31835 }, { "epoch": 0.87, "learning_rate": 8.80903808374215e-07, "loss": 1.3167, "step": 31836 }, { "epoch": 0.87, "learning_rate": 8.805408501750578e-07, "loss": 1.2241, "step": 31837 }, { "epoch": 0.87, "learning_rate": 8.80177963322263e-07, "loss": 1.3069, "step": 31838 }, { "epoch": 0.87, "learning_rate": 8.798151478186678e-07, "loss": 1.2947, "step": 31839 }, { "epoch": 0.87, "learning_rate": 8.794524036671082e-07, "loss": 1.2856, "step": 31840 }, { "epoch": 0.87, "learning_rate": 8.790897308704261e-07, "loss": 1.3362, "step": 31841 }, { "epoch": 0.87, "learning_rate": 8.787271294314559e-07, "loss": 1.301, "step": 31842 }, { "epoch": 0.87, "learning_rate": 8.783645993530365e-07, "loss": 1.2393, "step": 31843 }, { "epoch": 0.87, "learning_rate": 8.780021406380012e-07, "loss": 1.3481, "step": 31844 }, { "epoch": 0.87, "learning_rate": 8.7763975328919e-07, "loss": 1.3049, "step": 31845 }, { "epoch": 0.87, "learning_rate": 8.772774373094351e-07, "loss": 1.27, "step": 31846 }, { "epoch": 0.87, "learning_rate": 8.769151927015717e-07, "loss": 1.3125, "step": 31847 }, { "epoch": 0.87, "learning_rate": 8.765530194684325e-07, "loss": 1.2927, "step": 31848 }, { "epoch": 0.87, "learning_rate": 8.761909176128536e-07, "loss": 1.2173, "step": 31849 }, { "epoch": 0.87, "learning_rate": 8.758288871376674e-07, "loss": 1.1602, "step": 31850 }, { "epoch": 0.87, "learning_rate": 8.754669280457051e-07, "loss": 1.3105, "step": 31851 }, { "epoch": 0.87, "learning_rate": 8.751050403397976e-07, "loss": 1.2683, "step": 31852 }, { "epoch": 0.87, "learning_rate": 8.747432240227783e-07, "loss": 1.0308, "step": 31853 }, { "epoch": 0.87, "learning_rate": 8.74381479097477e-07, "loss": 1.2788, "step": 31854 }, { "epoch": 0.87, "learning_rate": 8.740198055667248e-07, "loss": 1.2295, "step": 31855 }, { "epoch": 0.87, "learning_rate": 8.736582034333473e-07, "loss": 1.1646, "step": 31856 }, { "epoch": 0.87, "learning_rate": 8.73296672700179e-07, "loss": 1.1194, "step": 31857 }, { "epoch": 0.87, "learning_rate": 8.729352133700463e-07, "loss": 1.2278, "step": 31858 }, { "epoch": 0.87, "learning_rate": 8.725738254457739e-07, "loss": 1.3174, "step": 31859 }, { "epoch": 0.87, "learning_rate": 8.722125089301947e-07, "loss": 1.2791, "step": 31860 }, { "epoch": 0.87, "learning_rate": 8.718512638261323e-07, "loss": 1.1843, "step": 31861 }, { "epoch": 0.87, "learning_rate": 8.714900901364132e-07, "loss": 1.2864, "step": 31862 }, { "epoch": 0.87, "learning_rate": 8.711289878638607e-07, "loss": 1.2358, "step": 31863 }, { "epoch": 0.87, "learning_rate": 8.707679570113048e-07, "loss": 1.1646, "step": 31864 }, { "epoch": 0.87, "learning_rate": 8.704069975815654e-07, "loss": 1.2151, "step": 31865 }, { "epoch": 0.87, "learning_rate": 8.700461095774726e-07, "loss": 1.4314, "step": 31866 }, { "epoch": 0.87, "learning_rate": 8.696852930018418e-07, "loss": 1.2776, "step": 31867 }, { "epoch": 0.87, "learning_rate": 8.693245478575018e-07, "loss": 1.3318, "step": 31868 }, { "epoch": 0.87, "learning_rate": 8.689638741472705e-07, "loss": 1.1824, "step": 31869 }, { "epoch": 0.87, "learning_rate": 8.686032718739768e-07, "loss": 1.4182, "step": 31870 }, { "epoch": 0.87, "learning_rate": 8.682427410404337e-07, "loss": 1.1737, "step": 31871 }, { "epoch": 0.87, "learning_rate": 8.678822816494647e-07, "loss": 1.3899, "step": 31872 }, { "epoch": 0.87, "learning_rate": 8.675218937038921e-07, "loss": 1.2219, "step": 31873 }, { "epoch": 0.87, "learning_rate": 8.671615772065345e-07, "loss": 1.304, "step": 31874 }, { "epoch": 0.87, "learning_rate": 8.668013321602098e-07, "loss": 1.3826, "step": 31875 }, { "epoch": 0.87, "learning_rate": 8.664411585677346e-07, "loss": 0.9922, "step": 31876 }, { "epoch": 0.87, "learning_rate": 8.660810564319311e-07, "loss": 1.3533, "step": 31877 }, { "epoch": 0.87, "learning_rate": 8.657210257556148e-07, "loss": 1.1746, "step": 31878 }, { "epoch": 0.87, "learning_rate": 8.653610665416012e-07, "loss": 1.1682, "step": 31879 }, { "epoch": 0.87, "learning_rate": 8.65001178792706e-07, "loss": 1.769, "step": 31880 }, { "epoch": 0.87, "learning_rate": 8.646413625117478e-07, "loss": 1.3472, "step": 31881 }, { "epoch": 0.87, "learning_rate": 8.64281617701539e-07, "loss": 1.1975, "step": 31882 }, { "epoch": 0.87, "learning_rate": 8.639219443648961e-07, "loss": 1.2766, "step": 31883 }, { "epoch": 0.87, "learning_rate": 8.635623425046292e-07, "loss": 1.2661, "step": 31884 }, { "epoch": 0.87, "learning_rate": 8.632028121235558e-07, "loss": 1.384, "step": 31885 }, { "epoch": 0.87, "learning_rate": 8.628433532244873e-07, "loss": 1.1909, "step": 31886 }, { "epoch": 0.87, "learning_rate": 8.624839658102346e-07, "loss": 1.2246, "step": 31887 }, { "epoch": 0.87, "learning_rate": 8.621246498836122e-07, "loss": 1.078, "step": 31888 }, { "epoch": 0.87, "learning_rate": 8.6176540544743e-07, "loss": 1.3904, "step": 31889 }, { "epoch": 0.87, "learning_rate": 8.614062325044969e-07, "loss": 1.3545, "step": 31890 }, { "epoch": 0.87, "learning_rate": 8.61047131057624e-07, "loss": 1.1914, "step": 31891 }, { "epoch": 0.87, "learning_rate": 8.606881011096213e-07, "loss": 1.3376, "step": 31892 }, { "epoch": 0.87, "learning_rate": 8.603291426632976e-07, "loss": 1.3577, "step": 31893 }, { "epoch": 0.87, "learning_rate": 8.599702557214617e-07, "loss": 1.2932, "step": 31894 }, { "epoch": 0.87, "learning_rate": 8.596114402869182e-07, "loss": 1.3176, "step": 31895 }, { "epoch": 0.87, "learning_rate": 8.592526963624781e-07, "loss": 1.2283, "step": 31896 }, { "epoch": 0.87, "learning_rate": 8.58894023950948e-07, "loss": 1.2817, "step": 31897 }, { "epoch": 0.87, "learning_rate": 8.585354230551312e-07, "loss": 1.3499, "step": 31898 }, { "epoch": 0.87, "learning_rate": 8.581768936778334e-07, "loss": 1.3296, "step": 31899 }, { "epoch": 0.87, "learning_rate": 8.578184358218622e-07, "loss": 1.1609, "step": 31900 }, { "epoch": 0.87, "learning_rate": 8.574600494900209e-07, "loss": 1.1726, "step": 31901 }, { "epoch": 0.87, "learning_rate": 8.571017346851119e-07, "loss": 1.2825, "step": 31902 }, { "epoch": 0.87, "learning_rate": 8.567434914099404e-07, "loss": 1.0775, "step": 31903 }, { "epoch": 0.87, "learning_rate": 8.563853196673066e-07, "loss": 1.0591, "step": 31904 }, { "epoch": 0.87, "learning_rate": 8.560272194600183e-07, "loss": 1.1758, "step": 31905 }, { "epoch": 0.87, "learning_rate": 8.556691907908699e-07, "loss": 1.2598, "step": 31906 }, { "epoch": 0.87, "learning_rate": 8.553112336626678e-07, "loss": 1.645, "step": 31907 }, { "epoch": 0.87, "learning_rate": 8.54953348078208e-07, "loss": 1.0637, "step": 31908 }, { "epoch": 0.87, "learning_rate": 8.545955340402967e-07, "loss": 1.2427, "step": 31909 }, { "epoch": 0.87, "learning_rate": 8.542377915517253e-07, "loss": 1.2417, "step": 31910 }, { "epoch": 0.87, "learning_rate": 8.538801206152991e-07, "loss": 1.3394, "step": 31911 }, { "epoch": 0.87, "learning_rate": 8.535225212338128e-07, "loss": 1.1218, "step": 31912 }, { "epoch": 0.87, "learning_rate": 8.531649934100683e-07, "loss": 1.2708, "step": 31913 }, { "epoch": 0.87, "learning_rate": 8.528075371468569e-07, "loss": 1.3225, "step": 31914 }, { "epoch": 0.87, "learning_rate": 8.524501524469786e-07, "loss": 1.3086, "step": 31915 }, { "epoch": 0.87, "learning_rate": 8.520928393132277e-07, "loss": 1.2603, "step": 31916 }, { "epoch": 0.87, "learning_rate": 8.517355977484043e-07, "loss": 1.293, "step": 31917 }, { "epoch": 0.87, "learning_rate": 8.513784277552961e-07, "loss": 1.2959, "step": 31918 }, { "epoch": 0.87, "learning_rate": 8.51021329336702e-07, "loss": 1.2622, "step": 31919 }, { "epoch": 0.87, "learning_rate": 8.506643024954153e-07, "loss": 1.3755, "step": 31920 }, { "epoch": 0.87, "learning_rate": 8.503073472342294e-07, "loss": 1.1558, "step": 31921 }, { "epoch": 0.87, "learning_rate": 8.499504635559363e-07, "loss": 1.2368, "step": 31922 }, { "epoch": 0.87, "learning_rate": 8.495936514633263e-07, "loss": 1.1438, "step": 31923 }, { "epoch": 0.87, "learning_rate": 8.492369109591947e-07, "loss": 1.2471, "step": 31924 }, { "epoch": 0.87, "learning_rate": 8.488802420463304e-07, "loss": 1.1069, "step": 31925 }, { "epoch": 0.87, "learning_rate": 8.485236447275236e-07, "loss": 1.2544, "step": 31926 }, { "epoch": 0.87, "learning_rate": 8.481671190055629e-07, "loss": 1.0388, "step": 31927 }, { "epoch": 0.87, "learning_rate": 8.478106648832407e-07, "loss": 1.3098, "step": 31928 }, { "epoch": 0.87, "learning_rate": 8.474542823633447e-07, "loss": 1.3772, "step": 31929 }, { "epoch": 0.87, "learning_rate": 8.470979714486627e-07, "loss": 1.2234, "step": 31930 }, { "epoch": 0.87, "learning_rate": 8.467417321419801e-07, "loss": 1.1592, "step": 31931 }, { "epoch": 0.87, "learning_rate": 8.463855644460873e-07, "loss": 1.2788, "step": 31932 }, { "epoch": 0.87, "learning_rate": 8.460294683637705e-07, "loss": 1.1533, "step": 31933 }, { "epoch": 0.87, "learning_rate": 8.456734438978121e-07, "loss": 1.1145, "step": 31934 }, { "epoch": 0.87, "learning_rate": 8.45317491051002e-07, "loss": 1.3728, "step": 31935 }, { "epoch": 0.87, "learning_rate": 8.449616098261226e-07, "loss": 1.3713, "step": 31936 }, { "epoch": 0.87, "learning_rate": 8.446058002259594e-07, "loss": 1.334, "step": 31937 }, { "epoch": 0.87, "learning_rate": 8.442500622532935e-07, "loss": 1.2732, "step": 31938 }, { "epoch": 0.87, "learning_rate": 8.438943959109102e-07, "loss": 1.3179, "step": 31939 }, { "epoch": 0.87, "learning_rate": 8.435388012015933e-07, "loss": 1.2424, "step": 31940 }, { "epoch": 0.87, "learning_rate": 8.431832781281224e-07, "loss": 1.2466, "step": 31941 }, { "epoch": 0.87, "learning_rate": 8.428278266932777e-07, "loss": 1.2966, "step": 31942 }, { "epoch": 0.87, "learning_rate": 8.424724468998435e-07, "loss": 1.2139, "step": 31943 }, { "epoch": 0.87, "learning_rate": 8.421171387506e-07, "loss": 1.3562, "step": 31944 }, { "epoch": 0.87, "learning_rate": 8.417619022483248e-07, "loss": 1.3254, "step": 31945 }, { "epoch": 0.87, "learning_rate": 8.414067373957968e-07, "loss": 1.2573, "step": 31946 }, { "epoch": 0.87, "learning_rate": 8.410516441957961e-07, "loss": 1.1895, "step": 31947 }, { "epoch": 0.87, "learning_rate": 8.406966226511015e-07, "loss": 1.3145, "step": 31948 }, { "epoch": 0.87, "learning_rate": 8.403416727644886e-07, "loss": 0.991, "step": 31949 }, { "epoch": 0.87, "learning_rate": 8.399867945387363e-07, "loss": 1.3503, "step": 31950 }, { "epoch": 0.87, "learning_rate": 8.396319879766179e-07, "loss": 1.0488, "step": 31951 }, { "epoch": 0.87, "learning_rate": 8.392772530809145e-07, "loss": 1.2712, "step": 31952 }, { "epoch": 0.87, "learning_rate": 8.389225898543962e-07, "loss": 1.1482, "step": 31953 }, { "epoch": 0.87, "learning_rate": 8.385679982998396e-07, "loss": 1.3638, "step": 31954 }, { "epoch": 0.87, "learning_rate": 8.382134784200191e-07, "loss": 1.2744, "step": 31955 }, { "epoch": 0.87, "learning_rate": 8.378590302177103e-07, "loss": 1.3955, "step": 31956 }, { "epoch": 0.87, "learning_rate": 8.37504653695681e-07, "loss": 1.291, "step": 31957 }, { "epoch": 0.87, "learning_rate": 8.37150348856709e-07, "loss": 1.1538, "step": 31958 }, { "epoch": 0.87, "learning_rate": 8.367961157035609e-07, "loss": 1.0654, "step": 31959 }, { "epoch": 0.87, "learning_rate": 8.364419542390156e-07, "loss": 1.2036, "step": 31960 }, { "epoch": 0.87, "learning_rate": 8.360878644658365e-07, "loss": 1.2683, "step": 31961 }, { "epoch": 0.87, "learning_rate": 8.357338463867981e-07, "loss": 1.2242, "step": 31962 }, { "epoch": 0.87, "learning_rate": 8.35379900004667e-07, "loss": 1.7222, "step": 31963 }, { "epoch": 0.87, "learning_rate": 8.350260253222154e-07, "loss": 1.0244, "step": 31964 }, { "epoch": 0.87, "learning_rate": 8.3467222234221e-07, "loss": 1.2073, "step": 31965 }, { "epoch": 0.87, "learning_rate": 8.343184910674185e-07, "loss": 1.188, "step": 31966 }, { "epoch": 0.87, "learning_rate": 8.339648315006111e-07, "loss": 1.6521, "step": 31967 }, { "epoch": 0.87, "learning_rate": 8.33611243644552e-07, "loss": 1.3313, "step": 31968 }, { "epoch": 0.87, "learning_rate": 8.332577275020082e-07, "loss": 1.3147, "step": 31969 }, { "epoch": 0.87, "learning_rate": 8.329042830757439e-07, "loss": 1.2876, "step": 31970 }, { "epoch": 0.87, "learning_rate": 8.32550910368528e-07, "loss": 1.1482, "step": 31971 }, { "epoch": 0.87, "learning_rate": 8.321976093831219e-07, "loss": 1.3298, "step": 31972 }, { "epoch": 0.87, "learning_rate": 8.318443801222919e-07, "loss": 1.302, "step": 31973 }, { "epoch": 0.87, "learning_rate": 8.314912225887972e-07, "loss": 1.1655, "step": 31974 }, { "epoch": 0.87, "learning_rate": 8.311381367854066e-07, "loss": 1.2017, "step": 31975 }, { "epoch": 0.87, "learning_rate": 8.3078512271488e-07, "loss": 1.2185, "step": 31976 }, { "epoch": 0.87, "learning_rate": 8.304321803799786e-07, "loss": 1.2964, "step": 31977 }, { "epoch": 0.87, "learning_rate": 8.300793097834614e-07, "loss": 1.2708, "step": 31978 }, { "epoch": 0.87, "learning_rate": 8.297265109280939e-07, "loss": 1.2983, "step": 31979 }, { "epoch": 0.87, "learning_rate": 8.293737838166349e-07, "loss": 1.2476, "step": 31980 }, { "epoch": 0.87, "learning_rate": 8.290211284518401e-07, "loss": 1.2146, "step": 31981 }, { "epoch": 0.87, "learning_rate": 8.28668544836474e-07, "loss": 1.3608, "step": 31982 }, { "epoch": 0.87, "learning_rate": 8.28316032973292e-07, "loss": 1.2344, "step": 31983 }, { "epoch": 0.87, "learning_rate": 8.279635928650532e-07, "loss": 1.3313, "step": 31984 }, { "epoch": 0.87, "learning_rate": 8.276112245145118e-07, "loss": 1.1968, "step": 31985 }, { "epoch": 0.87, "learning_rate": 8.272589279244292e-07, "loss": 1.4026, "step": 31986 }, { "epoch": 0.87, "learning_rate": 8.269067030975597e-07, "loss": 1.2073, "step": 31987 }, { "epoch": 0.87, "learning_rate": 8.265545500366578e-07, "loss": 1.1338, "step": 31988 }, { "epoch": 0.87, "learning_rate": 8.262024687444781e-07, "loss": 1.3582, "step": 31989 }, { "epoch": 0.87, "learning_rate": 8.258504592237781e-07, "loss": 1.3652, "step": 31990 }, { "epoch": 0.87, "learning_rate": 8.254985214773104e-07, "loss": 1.0476, "step": 31991 }, { "epoch": 0.87, "learning_rate": 8.25146655507828e-07, "loss": 1.1875, "step": 31992 }, { "epoch": 0.87, "learning_rate": 8.247948613180823e-07, "loss": 1.2668, "step": 31993 }, { "epoch": 0.87, "learning_rate": 8.244431389108287e-07, "loss": 1.188, "step": 31994 }, { "epoch": 0.87, "learning_rate": 8.240914882888174e-07, "loss": 1.2529, "step": 31995 }, { "epoch": 0.87, "learning_rate": 8.237399094547982e-07, "loss": 1.2456, "step": 31996 }, { "epoch": 0.87, "learning_rate": 8.233884024115235e-07, "loss": 1.189, "step": 31997 }, { "epoch": 0.87, "learning_rate": 8.230369671617422e-07, "loss": 1.3198, "step": 31998 }, { "epoch": 0.87, "learning_rate": 8.226856037082076e-07, "loss": 1.1172, "step": 31999 }, { "epoch": 0.87, "learning_rate": 8.223343120536609e-07, "loss": 1.167, "step": 32000 }, { "epoch": 0.87, "learning_rate": 8.219830922008576e-07, "loss": 1.1365, "step": 32001 }, { "epoch": 0.87, "learning_rate": 8.216319441525411e-07, "loss": 1.1274, "step": 32002 }, { "epoch": 0.87, "learning_rate": 8.212808679114637e-07, "loss": 1.2671, "step": 32003 }, { "epoch": 0.87, "learning_rate": 8.209298634803642e-07, "loss": 1.2595, "step": 32004 }, { "epoch": 0.87, "learning_rate": 8.20578930861996e-07, "loss": 1.3369, "step": 32005 }, { "epoch": 0.87, "learning_rate": 8.202280700590993e-07, "loss": 1.4014, "step": 32006 }, { "epoch": 0.87, "learning_rate": 8.19877281074426e-07, "loss": 1.26, "step": 32007 }, { "epoch": 0.87, "learning_rate": 8.19526563910712e-07, "loss": 1.3162, "step": 32008 }, { "epoch": 0.87, "learning_rate": 8.191759185707071e-07, "loss": 1.2205, "step": 32009 }, { "epoch": 0.87, "learning_rate": 8.188253450571504e-07, "loss": 1.1609, "step": 32010 }, { "epoch": 0.87, "learning_rate": 8.184748433727885e-07, "loss": 1.2305, "step": 32011 }, { "epoch": 0.87, "learning_rate": 8.181244135203625e-07, "loss": 1.1774, "step": 32012 }, { "epoch": 0.87, "learning_rate": 8.177740555026126e-07, "loss": 1.1943, "step": 32013 }, { "epoch": 0.87, "learning_rate": 8.174237693222808e-07, "loss": 1.3076, "step": 32014 }, { "epoch": 0.87, "learning_rate": 8.170735549821085e-07, "loss": 1.1257, "step": 32015 }, { "epoch": 0.87, "learning_rate": 8.167234124848344e-07, "loss": 1.2974, "step": 32016 }, { "epoch": 0.87, "learning_rate": 8.163733418331964e-07, "loss": 1.3494, "step": 32017 }, { "epoch": 0.87, "learning_rate": 8.160233430299369e-07, "loss": 1.2329, "step": 32018 }, { "epoch": 0.87, "learning_rate": 8.156734160777913e-07, "loss": 1.2483, "step": 32019 }, { "epoch": 0.87, "learning_rate": 8.153235609794985e-07, "loss": 1.1111, "step": 32020 }, { "epoch": 0.87, "learning_rate": 8.149737777377931e-07, "loss": 1.1465, "step": 32021 }, { "epoch": 0.87, "learning_rate": 8.146240663554161e-07, "loss": 1.2546, "step": 32022 }, { "epoch": 0.87, "learning_rate": 8.142744268351011e-07, "loss": 1.3276, "step": 32023 }, { "epoch": 0.87, "learning_rate": 8.139248591795834e-07, "loss": 1.2034, "step": 32024 }, { "epoch": 0.87, "learning_rate": 8.135753633915966e-07, "loss": 1.2141, "step": 32025 }, { "epoch": 0.87, "learning_rate": 8.132259394738784e-07, "loss": 1.2173, "step": 32026 }, { "epoch": 0.87, "learning_rate": 8.1287658742916e-07, "loss": 1.2334, "step": 32027 }, { "epoch": 0.87, "learning_rate": 8.125273072601725e-07, "loss": 1.1133, "step": 32028 }, { "epoch": 0.87, "learning_rate": 8.121780989696537e-07, "loss": 1.1177, "step": 32029 }, { "epoch": 0.87, "learning_rate": 8.118289625603337e-07, "loss": 1.2073, "step": 32030 }, { "epoch": 0.87, "learning_rate": 8.114798980349426e-07, "loss": 1.1025, "step": 32031 }, { "epoch": 0.87, "learning_rate": 8.111309053962102e-07, "loss": 1.3196, "step": 32032 }, { "epoch": 0.87, "learning_rate": 8.107819846468701e-07, "loss": 1.1626, "step": 32033 }, { "epoch": 0.87, "learning_rate": 8.104331357896512e-07, "loss": 1.1587, "step": 32034 }, { "epoch": 0.87, "learning_rate": 8.100843588272822e-07, "loss": 1.1738, "step": 32035 }, { "epoch": 0.87, "learning_rate": 8.097356537624901e-07, "loss": 1.1685, "step": 32036 }, { "epoch": 0.87, "learning_rate": 8.093870205980059e-07, "loss": 1.2361, "step": 32037 }, { "epoch": 0.87, "learning_rate": 8.090384593365563e-07, "loss": 1.3411, "step": 32038 }, { "epoch": 0.87, "learning_rate": 8.086899699808681e-07, "loss": 1.3318, "step": 32039 }, { "epoch": 0.87, "learning_rate": 8.083415525336657e-07, "loss": 1.3372, "step": 32040 }, { "epoch": 0.88, "learning_rate": 8.079932069976781e-07, "loss": 1.1617, "step": 32041 }, { "epoch": 0.88, "learning_rate": 8.076449333756297e-07, "loss": 1.2134, "step": 32042 }, { "epoch": 0.88, "learning_rate": 8.07296731670243e-07, "loss": 1.1406, "step": 32043 }, { "epoch": 0.88, "learning_rate": 8.069486018842454e-07, "loss": 1.2831, "step": 32044 }, { "epoch": 0.88, "learning_rate": 8.066005440203573e-07, "loss": 1.1934, "step": 32045 }, { "epoch": 0.88, "learning_rate": 8.062525580813074e-07, "loss": 1.3472, "step": 32046 }, { "epoch": 0.88, "learning_rate": 8.059046440698104e-07, "loss": 1.2805, "step": 32047 }, { "epoch": 0.88, "learning_rate": 8.05556801988594e-07, "loss": 1.3008, "step": 32048 }, { "epoch": 0.88, "learning_rate": 8.05209031840376e-07, "loss": 1.1997, "step": 32049 }, { "epoch": 0.88, "learning_rate": 8.048613336278821e-07, "loss": 1.2969, "step": 32050 }, { "epoch": 0.88, "learning_rate": 8.045137073538267e-07, "loss": 1.2898, "step": 32051 }, { "epoch": 0.88, "learning_rate": 8.041661530209322e-07, "loss": 1.3298, "step": 32052 }, { "epoch": 0.88, "learning_rate": 8.038186706319173e-07, "loss": 1.3171, "step": 32053 }, { "epoch": 0.88, "learning_rate": 8.034712601895033e-07, "loss": 1.3328, "step": 32054 }, { "epoch": 0.88, "learning_rate": 8.031239216964026e-07, "loss": 1.4116, "step": 32055 }, { "epoch": 0.88, "learning_rate": 8.027766551553374e-07, "loss": 1.1907, "step": 32056 }, { "epoch": 0.88, "learning_rate": 8.024294605690208e-07, "loss": 1.2849, "step": 32057 }, { "epoch": 0.88, "learning_rate": 8.020823379401732e-07, "loss": 1.2734, "step": 32058 }, { "epoch": 0.88, "learning_rate": 8.017352872715078e-07, "loss": 1.1763, "step": 32059 }, { "epoch": 0.88, "learning_rate": 8.013883085657381e-07, "loss": 1.2949, "step": 32060 }, { "epoch": 0.88, "learning_rate": 8.01041401825583e-07, "loss": 1.2351, "step": 32061 }, { "epoch": 0.88, "learning_rate": 8.006945670537547e-07, "loss": 1.2217, "step": 32062 }, { "epoch": 0.88, "learning_rate": 8.003478042529655e-07, "loss": 1.3184, "step": 32063 }, { "epoch": 0.88, "learning_rate": 8.000011134259277e-07, "loss": 1.5566, "step": 32064 }, { "epoch": 0.88, "learning_rate": 7.99654494575357e-07, "loss": 1.3298, "step": 32065 }, { "epoch": 0.88, "learning_rate": 7.993079477039634e-07, "loss": 1.1372, "step": 32066 }, { "epoch": 0.88, "learning_rate": 7.989614728144579e-07, "loss": 1.2103, "step": 32067 }, { "epoch": 0.88, "learning_rate": 7.986150699095496e-07, "loss": 1.3264, "step": 32068 }, { "epoch": 0.88, "learning_rate": 7.982687389919508e-07, "loss": 1.3936, "step": 32069 }, { "epoch": 0.88, "learning_rate": 7.979224800643715e-07, "loss": 1.282, "step": 32070 }, { "epoch": 0.88, "learning_rate": 7.975762931295195e-07, "loss": 1.1666, "step": 32071 }, { "epoch": 0.88, "learning_rate": 7.972301781901015e-07, "loss": 1.28, "step": 32072 }, { "epoch": 0.88, "learning_rate": 7.968841352488288e-07, "loss": 1.1746, "step": 32073 }, { "epoch": 0.88, "learning_rate": 7.965381643084069e-07, "loss": 1.3037, "step": 32074 }, { "epoch": 0.88, "learning_rate": 7.961922653715404e-07, "loss": 1.2476, "step": 32075 }, { "epoch": 0.88, "learning_rate": 7.958464384409403e-07, "loss": 1.4231, "step": 32076 }, { "epoch": 0.88, "learning_rate": 7.955006835193091e-07, "loss": 1.3003, "step": 32077 }, { "epoch": 0.88, "learning_rate": 7.951550006093523e-07, "loss": 1.335, "step": 32078 }, { "epoch": 0.88, "learning_rate": 7.948093897137732e-07, "loss": 1.2302, "step": 32079 }, { "epoch": 0.88, "learning_rate": 7.944638508352775e-07, "loss": 1.2854, "step": 32080 }, { "epoch": 0.88, "learning_rate": 7.941183839765687e-07, "loss": 1.22, "step": 32081 }, { "epoch": 0.88, "learning_rate": 7.937729891403489e-07, "loss": 1.2417, "step": 32082 }, { "epoch": 0.88, "learning_rate": 7.934276663293183e-07, "loss": 1.2732, "step": 32083 }, { "epoch": 0.88, "learning_rate": 7.930824155461814e-07, "loss": 1.0796, "step": 32084 }, { "epoch": 0.88, "learning_rate": 7.927372367936392e-07, "loss": 1.3135, "step": 32085 }, { "epoch": 0.88, "learning_rate": 7.923921300743908e-07, "loss": 1.3677, "step": 32086 }, { "epoch": 0.88, "learning_rate": 7.920470953911352e-07, "loss": 1.3257, "step": 32087 }, { "epoch": 0.88, "learning_rate": 7.917021327465746e-07, "loss": 1.3157, "step": 32088 }, { "epoch": 0.88, "learning_rate": 7.913572421434068e-07, "loss": 1.7051, "step": 32089 }, { "epoch": 0.88, "learning_rate": 7.910124235843275e-07, "loss": 1.3525, "step": 32090 }, { "epoch": 0.88, "learning_rate": 7.90667677072039e-07, "loss": 1.2942, "step": 32091 }, { "epoch": 0.88, "learning_rate": 7.903230026092334e-07, "loss": 1.249, "step": 32092 }, { "epoch": 0.88, "learning_rate": 7.899784001986144e-07, "loss": 1.2522, "step": 32093 }, { "epoch": 0.88, "learning_rate": 7.896338698428696e-07, "loss": 1.3296, "step": 32094 }, { "epoch": 0.88, "learning_rate": 7.892894115447003e-07, "loss": 1.0867, "step": 32095 }, { "epoch": 0.88, "learning_rate": 7.889450253067976e-07, "loss": 1.2354, "step": 32096 }, { "epoch": 0.88, "learning_rate": 7.886007111318594e-07, "loss": 1.4048, "step": 32097 }, { "epoch": 0.88, "learning_rate": 7.88256469022578e-07, "loss": 1.1562, "step": 32098 }, { "epoch": 0.88, "learning_rate": 7.879122989816467e-07, "loss": 1.2424, "step": 32099 }, { "epoch": 0.88, "learning_rate": 7.875682010117546e-07, "loss": 1.29, "step": 32100 }, { "epoch": 0.88, "learning_rate": 7.872241751155995e-07, "loss": 1.1467, "step": 32101 }, { "epoch": 0.88, "learning_rate": 7.868802212958704e-07, "loss": 1.2278, "step": 32102 }, { "epoch": 0.88, "learning_rate": 7.865363395552583e-07, "loss": 1.1689, "step": 32103 }, { "epoch": 0.88, "learning_rate": 7.861925298964513e-07, "loss": 1.2122, "step": 32104 }, { "epoch": 0.88, "learning_rate": 7.858487923221436e-07, "loss": 1.2983, "step": 32105 }, { "epoch": 0.88, "learning_rate": 7.855051268350211e-07, "loss": 1.2771, "step": 32106 }, { "epoch": 0.88, "learning_rate": 7.851615334377727e-07, "loss": 1.2332, "step": 32107 }, { "epoch": 0.88, "learning_rate": 7.848180121330884e-07, "loss": 1.3018, "step": 32108 }, { "epoch": 0.88, "learning_rate": 7.84474562923655e-07, "loss": 1.1433, "step": 32109 }, { "epoch": 0.88, "learning_rate": 7.841311858121592e-07, "loss": 1.7803, "step": 32110 }, { "epoch": 0.88, "learning_rate": 7.837878808012867e-07, "loss": 1.3264, "step": 32111 }, { "epoch": 0.88, "learning_rate": 7.834446478937241e-07, "loss": 1.0989, "step": 32112 }, { "epoch": 0.88, "learning_rate": 7.831014870921571e-07, "loss": 1.3267, "step": 32113 }, { "epoch": 0.88, "learning_rate": 7.827583983992704e-07, "loss": 1.6978, "step": 32114 }, { "epoch": 0.88, "learning_rate": 7.824153818177461e-07, "loss": 1.3035, "step": 32115 }, { "epoch": 0.88, "learning_rate": 7.820724373502708e-07, "loss": 1.2795, "step": 32116 }, { "epoch": 0.88, "learning_rate": 7.81729564999526e-07, "loss": 1.2932, "step": 32117 }, { "epoch": 0.88, "learning_rate": 7.813867647681949e-07, "loss": 1.2595, "step": 32118 }, { "epoch": 0.88, "learning_rate": 7.810440366589567e-07, "loss": 1.2764, "step": 32119 }, { "epoch": 0.88, "learning_rate": 7.807013806744967e-07, "loss": 1.2473, "step": 32120 }, { "epoch": 0.88, "learning_rate": 7.803587968174942e-07, "loss": 1.332, "step": 32121 }, { "epoch": 0.88, "learning_rate": 7.800162850906267e-07, "loss": 1.3118, "step": 32122 }, { "epoch": 0.88, "learning_rate": 7.79673845496578e-07, "loss": 1.291, "step": 32123 }, { "epoch": 0.88, "learning_rate": 7.793314780380267e-07, "loss": 1.2266, "step": 32124 }, { "epoch": 0.88, "learning_rate": 7.789891827176488e-07, "loss": 1.3145, "step": 32125 }, { "epoch": 0.88, "learning_rate": 7.786469595381219e-07, "loss": 1.175, "step": 32126 }, { "epoch": 0.88, "learning_rate": 7.783048085021272e-07, "loss": 1.3179, "step": 32127 }, { "epoch": 0.88, "learning_rate": 7.779627296123371e-07, "loss": 1.3291, "step": 32128 }, { "epoch": 0.88, "learning_rate": 7.776207228714338e-07, "loss": 1.4319, "step": 32129 }, { "epoch": 0.88, "learning_rate": 7.772787882820865e-07, "loss": 1.3516, "step": 32130 }, { "epoch": 0.88, "learning_rate": 7.769369258469739e-07, "loss": 1.1318, "step": 32131 }, { "epoch": 0.88, "learning_rate": 7.765951355687684e-07, "loss": 1.2898, "step": 32132 }, { "epoch": 0.88, "learning_rate": 7.762534174501491e-07, "loss": 1.196, "step": 32133 }, { "epoch": 0.88, "learning_rate": 7.759117714937813e-07, "loss": 1.1687, "step": 32134 }, { "epoch": 0.88, "learning_rate": 7.755701977023433e-07, "loss": 1.2395, "step": 32135 }, { "epoch": 0.88, "learning_rate": 7.752286960785082e-07, "loss": 1.1914, "step": 32136 }, { "epoch": 0.88, "learning_rate": 7.748872666249463e-07, "loss": 1.3679, "step": 32137 }, { "epoch": 0.88, "learning_rate": 7.745459093443275e-07, "loss": 1.0432, "step": 32138 }, { "epoch": 0.88, "learning_rate": 7.742046242393219e-07, "loss": 1.3848, "step": 32139 }, { "epoch": 0.88, "learning_rate": 7.738634113126031e-07, "loss": 1.1541, "step": 32140 }, { "epoch": 0.88, "learning_rate": 7.735222705668388e-07, "loss": 1.6875, "step": 32141 }, { "epoch": 0.88, "learning_rate": 7.73181202004697e-07, "loss": 1.2129, "step": 32142 }, { "epoch": 0.88, "learning_rate": 7.728402056288453e-07, "loss": 1.2141, "step": 32143 }, { "epoch": 0.88, "learning_rate": 7.724992814419541e-07, "loss": 1.3694, "step": 32144 }, { "epoch": 0.88, "learning_rate": 7.7215842944669e-07, "loss": 1.0544, "step": 32145 }, { "epoch": 0.88, "learning_rate": 7.718176496457197e-07, "loss": 1.2395, "step": 32146 }, { "epoch": 0.88, "learning_rate": 7.714769420417056e-07, "loss": 1.1804, "step": 32147 }, { "epoch": 0.88, "learning_rate": 7.71136306637319e-07, "loss": 1.1716, "step": 32148 }, { "epoch": 0.88, "learning_rate": 7.707957434352221e-07, "loss": 1.3438, "step": 32149 }, { "epoch": 0.88, "learning_rate": 7.704552524380793e-07, "loss": 1.4365, "step": 32150 }, { "epoch": 0.88, "learning_rate": 7.701148336485531e-07, "loss": 1.2507, "step": 32151 }, { "epoch": 0.88, "learning_rate": 7.697744870693091e-07, "loss": 1.3364, "step": 32152 }, { "epoch": 0.88, "learning_rate": 7.694342127030108e-07, "loss": 1.1768, "step": 32153 }, { "epoch": 0.88, "learning_rate": 7.690940105523159e-07, "loss": 1.259, "step": 32154 }, { "epoch": 0.88, "learning_rate": 7.687538806198902e-07, "loss": 1.2688, "step": 32155 }, { "epoch": 0.88, "learning_rate": 7.684138229083937e-07, "loss": 1.2634, "step": 32156 }, { "epoch": 0.88, "learning_rate": 7.680738374204866e-07, "loss": 1.3413, "step": 32157 }, { "epoch": 0.88, "learning_rate": 7.677339241588266e-07, "loss": 1.2415, "step": 32158 }, { "epoch": 0.88, "learning_rate": 7.673940831260773e-07, "loss": 1.2488, "step": 32159 }, { "epoch": 0.88, "learning_rate": 7.670543143248943e-07, "loss": 1.2114, "step": 32160 }, { "epoch": 0.88, "learning_rate": 7.667146177579377e-07, "loss": 1.6792, "step": 32161 }, { "epoch": 0.88, "learning_rate": 7.66374993427862e-07, "loss": 1.293, "step": 32162 }, { "epoch": 0.88, "learning_rate": 7.660354413373283e-07, "loss": 1.3057, "step": 32163 }, { "epoch": 0.88, "learning_rate": 7.656959614889903e-07, "loss": 1.2654, "step": 32164 }, { "epoch": 0.88, "learning_rate": 7.653565538855057e-07, "loss": 1.272, "step": 32165 }, { "epoch": 0.88, "learning_rate": 7.650172185295269e-07, "loss": 1.2732, "step": 32166 }, { "epoch": 0.88, "learning_rate": 7.646779554237116e-07, "loss": 1.1646, "step": 32167 }, { "epoch": 0.88, "learning_rate": 7.643387645707157e-07, "loss": 1.2517, "step": 32168 }, { "epoch": 0.88, "learning_rate": 7.63999645973188e-07, "loss": 1.2288, "step": 32169 }, { "epoch": 0.88, "learning_rate": 7.636605996337842e-07, "loss": 1.1564, "step": 32170 }, { "epoch": 0.88, "learning_rate": 7.633216255551556e-07, "loss": 1.1941, "step": 32171 }, { "epoch": 0.88, "learning_rate": 7.629827237399589e-07, "loss": 1.186, "step": 32172 }, { "epoch": 0.88, "learning_rate": 7.626438941908387e-07, "loss": 1.1984, "step": 32173 }, { "epoch": 0.88, "learning_rate": 7.623051369104506e-07, "loss": 1.3108, "step": 32174 }, { "epoch": 0.88, "learning_rate": 7.619664519014402e-07, "loss": 1.23, "step": 32175 }, { "epoch": 0.88, "learning_rate": 7.616278391664655e-07, "loss": 1.2466, "step": 32176 }, { "epoch": 0.88, "learning_rate": 7.612892987081654e-07, "loss": 1.3076, "step": 32177 }, { "epoch": 0.88, "learning_rate": 7.609508305291957e-07, "loss": 1.2854, "step": 32178 }, { "epoch": 0.88, "learning_rate": 7.606124346322008e-07, "loss": 1.3308, "step": 32179 }, { "epoch": 0.88, "learning_rate": 7.60274111019833e-07, "loss": 1.1633, "step": 32180 }, { "epoch": 0.88, "learning_rate": 7.599358596947326e-07, "loss": 1.4177, "step": 32181 }, { "epoch": 0.88, "learning_rate": 7.595976806595484e-07, "loss": 1.3196, "step": 32182 }, { "epoch": 0.88, "learning_rate": 7.592595739169284e-07, "loss": 1.2742, "step": 32183 }, { "epoch": 0.88, "learning_rate": 7.589215394695171e-07, "loss": 1.26, "step": 32184 }, { "epoch": 0.88, "learning_rate": 7.585835773199579e-07, "loss": 1.3396, "step": 32185 }, { "epoch": 0.88, "learning_rate": 7.582456874708932e-07, "loss": 1.2637, "step": 32186 }, { "epoch": 0.88, "learning_rate": 7.579078699249698e-07, "loss": 1.1194, "step": 32187 }, { "epoch": 0.88, "learning_rate": 7.5757012468483e-07, "loss": 1.2646, "step": 32188 }, { "epoch": 0.88, "learning_rate": 7.572324517531149e-07, "loss": 1.2227, "step": 32189 }, { "epoch": 0.88, "learning_rate": 7.568948511324647e-07, "loss": 1.4373, "step": 32190 }, { "epoch": 0.88, "learning_rate": 7.565573228255252e-07, "loss": 1.6846, "step": 32191 }, { "epoch": 0.88, "learning_rate": 7.562198668349352e-07, "loss": 1.2729, "step": 32192 }, { "epoch": 0.88, "learning_rate": 7.558824831633338e-07, "loss": 1.3618, "step": 32193 }, { "epoch": 0.88, "learning_rate": 7.555451718133588e-07, "loss": 1.1748, "step": 32194 }, { "epoch": 0.88, "learning_rate": 7.552079327876527e-07, "loss": 1.0334, "step": 32195 }, { "epoch": 0.88, "learning_rate": 7.548707660888532e-07, "loss": 1.2224, "step": 32196 }, { "epoch": 0.88, "learning_rate": 7.545336717195961e-07, "loss": 1.1479, "step": 32197 }, { "epoch": 0.88, "learning_rate": 7.541966496825215e-07, "loss": 1.2483, "step": 32198 }, { "epoch": 0.88, "learning_rate": 7.538596999802638e-07, "loss": 1.2092, "step": 32199 }, { "epoch": 0.88, "learning_rate": 7.535228226154612e-07, "loss": 1.3274, "step": 32200 }, { "epoch": 0.88, "learning_rate": 7.531860175907457e-07, "loss": 1.3306, "step": 32201 }, { "epoch": 0.88, "learning_rate": 7.528492849087565e-07, "loss": 1.313, "step": 32202 }, { "epoch": 0.88, "learning_rate": 7.525126245721259e-07, "loss": 1.2754, "step": 32203 }, { "epoch": 0.88, "learning_rate": 7.521760365834885e-07, "loss": 1.3032, "step": 32204 }, { "epoch": 0.88, "learning_rate": 7.518395209454743e-07, "loss": 1.3643, "step": 32205 }, { "epoch": 0.88, "learning_rate": 7.515030776607224e-07, "loss": 1.1316, "step": 32206 }, { "epoch": 0.88, "learning_rate": 7.511667067318596e-07, "loss": 1.2683, "step": 32207 }, { "epoch": 0.88, "learning_rate": 7.508304081615203e-07, "loss": 1.1941, "step": 32208 }, { "epoch": 0.88, "learning_rate": 7.504941819523337e-07, "loss": 1.103, "step": 32209 }, { "epoch": 0.88, "learning_rate": 7.50158028106932e-07, "loss": 1.2322, "step": 32210 }, { "epoch": 0.88, "learning_rate": 7.498219466279444e-07, "loss": 1.2056, "step": 32211 }, { "epoch": 0.88, "learning_rate": 7.494859375179997e-07, "loss": 1.3247, "step": 32212 }, { "epoch": 0.88, "learning_rate": 7.491500007797259e-07, "loss": 1.3887, "step": 32213 }, { "epoch": 0.88, "learning_rate": 7.488141364157531e-07, "loss": 1.1417, "step": 32214 }, { "epoch": 0.88, "learning_rate": 7.484783444287103e-07, "loss": 1.3257, "step": 32215 }, { "epoch": 0.88, "learning_rate": 7.481426248212198e-07, "loss": 1.261, "step": 32216 }, { "epoch": 0.88, "learning_rate": 7.478069775959129e-07, "loss": 1.3713, "step": 32217 }, { "epoch": 0.88, "learning_rate": 7.47471402755412e-07, "loss": 1.2102, "step": 32218 }, { "epoch": 0.88, "learning_rate": 7.47135900302347e-07, "loss": 1.2578, "step": 32219 }, { "epoch": 0.88, "learning_rate": 7.468004702393361e-07, "loss": 1.3457, "step": 32220 }, { "epoch": 0.88, "learning_rate": 7.464651125690092e-07, "loss": 1.2151, "step": 32221 }, { "epoch": 0.88, "learning_rate": 7.461298272939854e-07, "loss": 1.2798, "step": 32222 }, { "epoch": 0.88, "learning_rate": 7.457946144168949e-07, "loss": 1.144, "step": 32223 }, { "epoch": 0.88, "learning_rate": 7.45459473940352e-07, "loss": 1.1517, "step": 32224 }, { "epoch": 0.88, "learning_rate": 7.451244058669837e-07, "loss": 1.2366, "step": 32225 }, { "epoch": 0.88, "learning_rate": 7.447894101994091e-07, "loss": 1.3071, "step": 32226 }, { "epoch": 0.88, "learning_rate": 7.444544869402526e-07, "loss": 1.3765, "step": 32227 }, { "epoch": 0.88, "learning_rate": 7.441196360921288e-07, "loss": 1.0764, "step": 32228 }, { "epoch": 0.88, "learning_rate": 7.437848576576612e-07, "loss": 1.1182, "step": 32229 }, { "epoch": 0.88, "learning_rate": 7.434501516394688e-07, "loss": 1.2051, "step": 32230 }, { "epoch": 0.88, "learning_rate": 7.431155180401705e-07, "loss": 1.1433, "step": 32231 }, { "epoch": 0.88, "learning_rate": 7.427809568623834e-07, "loss": 1.2141, "step": 32232 }, { "epoch": 0.88, "learning_rate": 7.42446468108724e-07, "loss": 1.4048, "step": 32233 }, { "epoch": 0.88, "learning_rate": 7.421120517818103e-07, "loss": 1.2839, "step": 32234 }, { "epoch": 0.88, "learning_rate": 7.417777078842603e-07, "loss": 1.2798, "step": 32235 }, { "epoch": 0.88, "learning_rate": 7.414434364186862e-07, "loss": 1.2764, "step": 32236 }, { "epoch": 0.88, "learning_rate": 7.411092373877049e-07, "loss": 1.1453, "step": 32237 }, { "epoch": 0.88, "learning_rate": 7.40775110793932e-07, "loss": 1.1685, "step": 32238 }, { "epoch": 0.88, "learning_rate": 7.404410566399811e-07, "loss": 1.2893, "step": 32239 }, { "epoch": 0.88, "learning_rate": 7.401070749284644e-07, "loss": 1.3337, "step": 32240 }, { "epoch": 0.88, "learning_rate": 7.397731656619944e-07, "loss": 1.21, "step": 32241 }, { "epoch": 0.88, "learning_rate": 7.394393288431867e-07, "loss": 1.3682, "step": 32242 }, { "epoch": 0.88, "learning_rate": 7.391055644746503e-07, "loss": 1.2771, "step": 32243 }, { "epoch": 0.88, "learning_rate": 7.387718725589965e-07, "loss": 1.3293, "step": 32244 }, { "epoch": 0.88, "learning_rate": 7.384382530988377e-07, "loss": 1.4473, "step": 32245 }, { "epoch": 0.88, "learning_rate": 7.381047060967827e-07, "loss": 1.1973, "step": 32246 }, { "epoch": 0.88, "learning_rate": 7.37771231555442e-07, "loss": 1.3354, "step": 32247 }, { "epoch": 0.88, "learning_rate": 7.374378294774209e-07, "loss": 1.3501, "step": 32248 }, { "epoch": 0.88, "learning_rate": 7.371044998653332e-07, "loss": 1.3584, "step": 32249 }, { "epoch": 0.88, "learning_rate": 7.367712427217844e-07, "loss": 1.248, "step": 32250 }, { "epoch": 0.88, "learning_rate": 7.364380580493813e-07, "loss": 1.2783, "step": 32251 }, { "epoch": 0.88, "learning_rate": 7.361049458507285e-07, "loss": 1.24, "step": 32252 }, { "epoch": 0.88, "learning_rate": 7.357719061284363e-07, "loss": 1.3447, "step": 32253 }, { "epoch": 0.88, "learning_rate": 7.354389388851091e-07, "loss": 1.2947, "step": 32254 }, { "epoch": 0.88, "learning_rate": 7.351060441233504e-07, "loss": 1.137, "step": 32255 }, { "epoch": 0.88, "learning_rate": 7.347732218457638e-07, "loss": 1.1682, "step": 32256 }, { "epoch": 0.88, "learning_rate": 7.34440472054957e-07, "loss": 1.0479, "step": 32257 }, { "epoch": 0.88, "learning_rate": 7.341077947535302e-07, "loss": 1.1968, "step": 32258 }, { "epoch": 0.88, "learning_rate": 7.337751899440859e-07, "loss": 1.3101, "step": 32259 }, { "epoch": 0.88, "learning_rate": 7.334426576292286e-07, "loss": 1.2559, "step": 32260 }, { "epoch": 0.88, "learning_rate": 7.331101978115562e-07, "loss": 1.1143, "step": 32261 }, { "epoch": 0.88, "learning_rate": 7.327778104936755e-07, "loss": 1.2854, "step": 32262 }, { "epoch": 0.88, "learning_rate": 7.324454956781812e-07, "loss": 1.2456, "step": 32263 }, { "epoch": 0.88, "learning_rate": 7.321132533676767e-07, "loss": 1.2866, "step": 32264 }, { "epoch": 0.88, "learning_rate": 7.317810835647576e-07, "loss": 1.3872, "step": 32265 }, { "epoch": 0.88, "learning_rate": 7.314489862720287e-07, "loss": 1.1826, "step": 32266 }, { "epoch": 0.88, "learning_rate": 7.311169614920821e-07, "loss": 1.2812, "step": 32267 }, { "epoch": 0.88, "learning_rate": 7.307850092275181e-07, "loss": 1.2822, "step": 32268 }, { "epoch": 0.88, "learning_rate": 7.304531294809325e-07, "loss": 1.0837, "step": 32269 }, { "epoch": 0.88, "learning_rate": 7.301213222549264e-07, "loss": 1.2598, "step": 32270 }, { "epoch": 0.88, "learning_rate": 7.297895875520889e-07, "loss": 1.3176, "step": 32271 }, { "epoch": 0.88, "learning_rate": 7.294579253750189e-07, "loss": 1.2888, "step": 32272 }, { "epoch": 0.88, "learning_rate": 7.291263357263101e-07, "loss": 1.3203, "step": 32273 }, { "epoch": 0.88, "learning_rate": 7.287948186085614e-07, "loss": 1.2249, "step": 32274 }, { "epoch": 0.88, "learning_rate": 7.284633740243574e-07, "loss": 1.1445, "step": 32275 }, { "epoch": 0.88, "learning_rate": 7.281320019762972e-07, "loss": 1.2393, "step": 32276 }, { "epoch": 0.88, "learning_rate": 7.278007024669742e-07, "loss": 1.3486, "step": 32277 }, { "epoch": 0.88, "learning_rate": 7.274694754989775e-07, "loss": 1.3179, "step": 32278 }, { "epoch": 0.88, "learning_rate": 7.271383210749006e-07, "loss": 1.1682, "step": 32279 }, { "epoch": 0.88, "learning_rate": 7.268072391973302e-07, "loss": 1.1936, "step": 32280 }, { "epoch": 0.88, "learning_rate": 7.264762298688622e-07, "loss": 1.3264, "step": 32281 }, { "epoch": 0.88, "learning_rate": 7.26145293092082e-07, "loss": 1.1614, "step": 32282 }, { "epoch": 0.88, "learning_rate": 7.258144288695812e-07, "loss": 1.3245, "step": 32283 }, { "epoch": 0.88, "learning_rate": 7.254836372039453e-07, "loss": 1.4456, "step": 32284 }, { "epoch": 0.88, "learning_rate": 7.251529180977657e-07, "loss": 1.1968, "step": 32285 }, { "epoch": 0.88, "learning_rate": 7.24822271553629e-07, "loss": 1.4092, "step": 32286 }, { "epoch": 0.88, "learning_rate": 7.244916975741212e-07, "loss": 1.3989, "step": 32287 }, { "epoch": 0.88, "learning_rate": 7.241611961618266e-07, "loss": 1.2615, "step": 32288 }, { "epoch": 0.88, "learning_rate": 7.238307673193346e-07, "loss": 1.105, "step": 32289 }, { "epoch": 0.88, "learning_rate": 7.235004110492294e-07, "loss": 1.0867, "step": 32290 }, { "epoch": 0.88, "learning_rate": 7.231701273540926e-07, "loss": 1.311, "step": 32291 }, { "epoch": 0.88, "learning_rate": 7.228399162365129e-07, "loss": 1.2659, "step": 32292 }, { "epoch": 0.88, "learning_rate": 7.225097776990697e-07, "loss": 1.4048, "step": 32293 }, { "epoch": 0.88, "learning_rate": 7.221797117443486e-07, "loss": 1.2478, "step": 32294 }, { "epoch": 0.88, "learning_rate": 7.218497183749296e-07, "loss": 1.2693, "step": 32295 }, { "epoch": 0.88, "learning_rate": 7.215197975933963e-07, "loss": 1.3047, "step": 32296 }, { "epoch": 0.88, "learning_rate": 7.211899494023289e-07, "loss": 1.3574, "step": 32297 }, { "epoch": 0.88, "learning_rate": 7.208601738043086e-07, "loss": 1.3535, "step": 32298 }, { "epoch": 0.88, "learning_rate": 7.205304708019123e-07, "loss": 1.2615, "step": 32299 }, { "epoch": 0.88, "learning_rate": 7.202008403977245e-07, "loss": 1.3337, "step": 32300 }, { "epoch": 0.88, "learning_rate": 7.198712825943221e-07, "loss": 1.101, "step": 32301 }, { "epoch": 0.88, "learning_rate": 7.19541797394282e-07, "loss": 1.2849, "step": 32302 }, { "epoch": 0.88, "learning_rate": 7.192123848001819e-07, "loss": 1.2029, "step": 32303 }, { "epoch": 0.88, "learning_rate": 7.188830448146023e-07, "loss": 1.2222, "step": 32304 }, { "epoch": 0.88, "learning_rate": 7.185537774401163e-07, "loss": 1.1711, "step": 32305 }, { "epoch": 0.88, "learning_rate": 7.182245826793e-07, "loss": 1.3374, "step": 32306 }, { "epoch": 0.88, "learning_rate": 7.17895460534731e-07, "loss": 1.217, "step": 32307 }, { "epoch": 0.88, "learning_rate": 7.17566411008982e-07, "loss": 1.2463, "step": 32308 }, { "epoch": 0.88, "learning_rate": 7.172374341046318e-07, "loss": 1.3958, "step": 32309 }, { "epoch": 0.88, "learning_rate": 7.169085298242473e-07, "loss": 1.2825, "step": 32310 }, { "epoch": 0.88, "learning_rate": 7.165796981704077e-07, "loss": 1.1313, "step": 32311 }, { "epoch": 0.88, "learning_rate": 7.162509391456807e-07, "loss": 1.2296, "step": 32312 }, { "epoch": 0.88, "learning_rate": 7.159222527526444e-07, "loss": 1.1775, "step": 32313 }, { "epoch": 0.88, "learning_rate": 7.155936389938633e-07, "loss": 1.1235, "step": 32314 }, { "epoch": 0.88, "learning_rate": 7.152650978719133e-07, "loss": 1.1436, "step": 32315 }, { "epoch": 0.88, "learning_rate": 7.149366293893612e-07, "loss": 1.249, "step": 32316 }, { "epoch": 0.88, "learning_rate": 7.146082335487825e-07, "loss": 1.1992, "step": 32317 }, { "epoch": 0.88, "learning_rate": 7.142799103527398e-07, "loss": 1.0494, "step": 32318 }, { "epoch": 0.88, "learning_rate": 7.139516598038054e-07, "loss": 1.4324, "step": 32319 }, { "epoch": 0.88, "learning_rate": 7.136234819045463e-07, "loss": 1.1438, "step": 32320 }, { "epoch": 0.88, "learning_rate": 7.132953766575312e-07, "loss": 1.2119, "step": 32321 }, { "epoch": 0.88, "learning_rate": 7.129673440653251e-07, "loss": 1.1731, "step": 32322 }, { "epoch": 0.88, "learning_rate": 7.126393841304957e-07, "loss": 1.3459, "step": 32323 }, { "epoch": 0.88, "learning_rate": 7.123114968556089e-07, "loss": 1.2722, "step": 32324 }, { "epoch": 0.88, "learning_rate": 7.119836822432302e-07, "loss": 1.2068, "step": 32325 }, { "epoch": 0.88, "learning_rate": 7.116559402959233e-07, "loss": 1.3389, "step": 32326 }, { "epoch": 0.88, "learning_rate": 7.113282710162506e-07, "loss": 1.1964, "step": 32327 }, { "epoch": 0.88, "learning_rate": 7.110006744067799e-07, "loss": 1.1846, "step": 32328 }, { "epoch": 0.88, "learning_rate": 7.106731504700715e-07, "loss": 1.4224, "step": 32329 }, { "epoch": 0.88, "learning_rate": 7.103456992086888e-07, "loss": 1.0369, "step": 32330 }, { "epoch": 0.88, "learning_rate": 7.100183206251909e-07, "loss": 1.302, "step": 32331 }, { "epoch": 0.88, "learning_rate": 7.096910147221436e-07, "loss": 1.1914, "step": 32332 }, { "epoch": 0.88, "learning_rate": 7.093637815021037e-07, "loss": 1.1106, "step": 32333 }, { "epoch": 0.88, "learning_rate": 7.090366209676347e-07, "loss": 1.3, "step": 32334 }, { "epoch": 0.88, "learning_rate": 7.087095331212913e-07, "loss": 1.2983, "step": 32335 }, { "epoch": 0.88, "learning_rate": 7.083825179656379e-07, "loss": 1.219, "step": 32336 }, { "epoch": 0.88, "learning_rate": 7.080555755032292e-07, "loss": 1.3381, "step": 32337 }, { "epoch": 0.88, "learning_rate": 7.077287057366233e-07, "loss": 1.1606, "step": 32338 }, { "epoch": 0.88, "learning_rate": 7.074019086683803e-07, "loss": 1.4829, "step": 32339 }, { "epoch": 0.88, "learning_rate": 7.070751843010559e-07, "loss": 1.2556, "step": 32340 }, { "epoch": 0.88, "learning_rate": 7.067485326372036e-07, "loss": 1.2563, "step": 32341 }, { "epoch": 0.88, "learning_rate": 7.064219536793804e-07, "loss": 1.2944, "step": 32342 }, { "epoch": 0.88, "learning_rate": 7.060954474301429e-07, "loss": 1.1194, "step": 32343 }, { "epoch": 0.88, "learning_rate": 7.057690138920448e-07, "loss": 1.2136, "step": 32344 }, { "epoch": 0.88, "learning_rate": 7.054426530676395e-07, "loss": 1.439, "step": 32345 }, { "epoch": 0.88, "learning_rate": 7.051163649594784e-07, "loss": 1.2876, "step": 32346 }, { "epoch": 0.88, "learning_rate": 7.047901495701171e-07, "loss": 1.2646, "step": 32347 }, { "epoch": 0.88, "learning_rate": 7.044640069021069e-07, "loss": 1.1501, "step": 32348 }, { "epoch": 0.88, "learning_rate": 7.041379369580003e-07, "loss": 1.3252, "step": 32349 }, { "epoch": 0.88, "learning_rate": 7.038119397403442e-07, "loss": 1.2029, "step": 32350 }, { "epoch": 0.88, "learning_rate": 7.034860152516953e-07, "loss": 1.2572, "step": 32351 }, { "epoch": 0.88, "learning_rate": 7.031601634945995e-07, "loss": 1.3357, "step": 32352 }, { "epoch": 0.88, "learning_rate": 7.028343844716046e-07, "loss": 1.3391, "step": 32353 }, { "epoch": 0.88, "learning_rate": 7.025086781852642e-07, "loss": 1.0898, "step": 32354 }, { "epoch": 0.88, "learning_rate": 7.021830446381217e-07, "loss": 1.2766, "step": 32355 }, { "epoch": 0.88, "learning_rate": 7.018574838327307e-07, "loss": 1.2661, "step": 32356 }, { "epoch": 0.88, "learning_rate": 7.015319957716315e-07, "loss": 1.4092, "step": 32357 }, { "epoch": 0.88, "learning_rate": 7.012065804573742e-07, "loss": 1.1833, "step": 32358 }, { "epoch": 0.88, "learning_rate": 7.008812378925023e-07, "loss": 1.3665, "step": 32359 }, { "epoch": 0.88, "learning_rate": 7.005559680795659e-07, "loss": 1.2124, "step": 32360 }, { "epoch": 0.88, "learning_rate": 7.002307710211054e-07, "loss": 1.4077, "step": 32361 }, { "epoch": 0.88, "learning_rate": 6.999056467196663e-07, "loss": 1.1934, "step": 32362 }, { "epoch": 0.88, "learning_rate": 6.995805951777912e-07, "loss": 1.2117, "step": 32363 }, { "epoch": 0.88, "learning_rate": 6.992556163980257e-07, "loss": 1.2578, "step": 32364 }, { "epoch": 0.88, "learning_rate": 6.989307103829101e-07, "loss": 1.2871, "step": 32365 }, { "epoch": 0.88, "learning_rate": 6.986058771349879e-07, "loss": 1.3264, "step": 32366 }, { "epoch": 0.88, "learning_rate": 6.982811166567971e-07, "loss": 1.082, "step": 32367 }, { "epoch": 0.88, "learning_rate": 6.979564289508834e-07, "loss": 1.2771, "step": 32368 }, { "epoch": 0.88, "learning_rate": 6.976318140197835e-07, "loss": 1.2693, "step": 32369 }, { "epoch": 0.88, "learning_rate": 6.973072718660368e-07, "loss": 1.3376, "step": 32370 }, { "epoch": 0.88, "learning_rate": 6.969828024921843e-07, "loss": 1.3171, "step": 32371 }, { "epoch": 0.88, "learning_rate": 6.966584059007653e-07, "loss": 1.3765, "step": 32372 }, { "epoch": 0.88, "learning_rate": 6.963340820943154e-07, "loss": 1.2925, "step": 32373 }, { "epoch": 0.88, "learning_rate": 6.960098310753716e-07, "loss": 1.1309, "step": 32374 }, { "epoch": 0.88, "learning_rate": 6.956856528464729e-07, "loss": 1.2908, "step": 32375 }, { "epoch": 0.88, "learning_rate": 6.953615474101538e-07, "loss": 1.0886, "step": 32376 }, { "epoch": 0.88, "learning_rate": 6.950375147689514e-07, "loss": 1.1592, "step": 32377 }, { "epoch": 0.88, "learning_rate": 6.947135549253992e-07, "loss": 1.2905, "step": 32378 }, { "epoch": 0.88, "learning_rate": 6.943896678820327e-07, "loss": 1.3203, "step": 32379 }, { "epoch": 0.88, "learning_rate": 6.940658536413869e-07, "loss": 1.2568, "step": 32380 }, { "epoch": 0.88, "learning_rate": 6.937421122059929e-07, "loss": 1.3896, "step": 32381 }, { "epoch": 0.88, "learning_rate": 6.934184435783831e-07, "loss": 1.3003, "step": 32382 }, { "epoch": 0.88, "learning_rate": 6.930948477610932e-07, "loss": 1.3538, "step": 32383 }, { "epoch": 0.88, "learning_rate": 6.927713247566525e-07, "loss": 1.1758, "step": 32384 }, { "epoch": 0.88, "learning_rate": 6.9244787456759e-07, "loss": 1.2708, "step": 32385 }, { "epoch": 0.88, "learning_rate": 6.921244971964414e-07, "loss": 1.2795, "step": 32386 }, { "epoch": 0.88, "learning_rate": 6.918011926457335e-07, "loss": 1.5117, "step": 32387 }, { "epoch": 0.88, "learning_rate": 6.914779609179955e-07, "loss": 1.2327, "step": 32388 }, { "epoch": 0.88, "learning_rate": 6.911548020157566e-07, "loss": 1.113, "step": 32389 }, { "epoch": 0.88, "learning_rate": 6.908317159415456e-07, "loss": 1.1169, "step": 32390 }, { "epoch": 0.88, "learning_rate": 6.905087026978896e-07, "loss": 1.1809, "step": 32391 }, { "epoch": 0.88, "learning_rate": 6.901857622873165e-07, "loss": 1.3242, "step": 32392 }, { "epoch": 0.88, "learning_rate": 6.898628947123509e-07, "loss": 1.1501, "step": 32393 }, { "epoch": 0.88, "learning_rate": 6.895400999755209e-07, "loss": 1.2966, "step": 32394 }, { "epoch": 0.88, "learning_rate": 6.892173780793499e-07, "loss": 1.3054, "step": 32395 }, { "epoch": 0.88, "learning_rate": 6.88894729026367e-07, "loss": 1.3904, "step": 32396 }, { "epoch": 0.88, "learning_rate": 6.885721528190903e-07, "loss": 1.3208, "step": 32397 }, { "epoch": 0.88, "learning_rate": 6.882496494600477e-07, "loss": 1.2993, "step": 32398 }, { "epoch": 0.88, "learning_rate": 6.879272189517594e-07, "loss": 1.2986, "step": 32399 }, { "epoch": 0.88, "learning_rate": 6.876048612967523e-07, "loss": 1.3269, "step": 32400 }, { "epoch": 0.88, "learning_rate": 6.872825764975444e-07, "loss": 1.2756, "step": 32401 }, { "epoch": 0.88, "learning_rate": 6.86960364556658e-07, "loss": 1.0405, "step": 32402 }, { "epoch": 0.88, "learning_rate": 6.866382254766158e-07, "loss": 1.2915, "step": 32403 }, { "epoch": 0.88, "learning_rate": 6.863161592599366e-07, "loss": 1.1487, "step": 32404 }, { "epoch": 0.88, "learning_rate": 6.859941659091396e-07, "loss": 1.2998, "step": 32405 }, { "epoch": 0.88, "learning_rate": 6.85672245426744e-07, "loss": 1.3784, "step": 32406 }, { "epoch": 0.89, "learning_rate": 6.853503978152698e-07, "loss": 1.2754, "step": 32407 }, { "epoch": 0.89, "learning_rate": 6.85028623077234e-07, "loss": 1.2632, "step": 32408 }, { "epoch": 0.89, "learning_rate": 6.847069212151536e-07, "loss": 1.261, "step": 32409 }, { "epoch": 0.89, "learning_rate": 6.843852922315452e-07, "loss": 1.3027, "step": 32410 }, { "epoch": 0.89, "learning_rate": 6.840637361289271e-07, "loss": 1.2747, "step": 32411 }, { "epoch": 0.89, "learning_rate": 6.837422529098126e-07, "loss": 1.151, "step": 32412 }, { "epoch": 0.89, "learning_rate": 6.834208425767197e-07, "loss": 1.0955, "step": 32413 }, { "epoch": 0.89, "learning_rate": 6.830995051321577e-07, "loss": 1.6621, "step": 32414 }, { "epoch": 0.89, "learning_rate": 6.827782405786476e-07, "loss": 1.0789, "step": 32415 }, { "epoch": 0.89, "learning_rate": 6.824570489186977e-07, "loss": 1.272, "step": 32416 }, { "epoch": 0.89, "learning_rate": 6.821359301548214e-07, "loss": 1.0735, "step": 32417 }, { "epoch": 0.89, "learning_rate": 6.818148842895333e-07, "loss": 1.168, "step": 32418 }, { "epoch": 0.89, "learning_rate": 6.814939113253449e-07, "loss": 1.3645, "step": 32419 }, { "epoch": 0.89, "learning_rate": 6.811730112647652e-07, "loss": 1.3352, "step": 32420 }, { "epoch": 0.89, "learning_rate": 6.808521841103044e-07, "loss": 1.3533, "step": 32421 }, { "epoch": 0.89, "learning_rate": 6.805314298644761e-07, "loss": 1.3591, "step": 32422 }, { "epoch": 0.89, "learning_rate": 6.802107485297871e-07, "loss": 1.4109, "step": 32423 }, { "epoch": 0.89, "learning_rate": 6.798901401087465e-07, "loss": 1.29, "step": 32424 }, { "epoch": 0.89, "learning_rate": 6.795696046038625e-07, "loss": 1.3777, "step": 32425 }, { "epoch": 0.89, "learning_rate": 6.792491420176428e-07, "loss": 1.1616, "step": 32426 }, { "epoch": 0.89, "learning_rate": 6.789287523525967e-07, "loss": 1.2837, "step": 32427 }, { "epoch": 0.89, "learning_rate": 6.786084356112277e-07, "loss": 1.2944, "step": 32428 }, { "epoch": 0.89, "learning_rate": 6.782881917960427e-07, "loss": 1.2603, "step": 32429 }, { "epoch": 0.89, "learning_rate": 6.779680209095462e-07, "loss": 1.0667, "step": 32430 }, { "epoch": 0.89, "learning_rate": 6.776479229542476e-07, "loss": 1.4446, "step": 32431 }, { "epoch": 0.89, "learning_rate": 6.773278979326459e-07, "loss": 1.2512, "step": 32432 }, { "epoch": 0.89, "learning_rate": 6.770079458472478e-07, "loss": 1.3171, "step": 32433 }, { "epoch": 0.89, "learning_rate": 6.766880667005538e-07, "loss": 1.3975, "step": 32434 }, { "epoch": 0.89, "learning_rate": 6.763682604950716e-07, "loss": 1.2827, "step": 32435 }, { "epoch": 0.89, "learning_rate": 6.760485272332973e-07, "loss": 1.1992, "step": 32436 }, { "epoch": 0.89, "learning_rate": 6.757288669177354e-07, "loss": 1.3999, "step": 32437 }, { "epoch": 0.89, "learning_rate": 6.754092795508848e-07, "loss": 1.2202, "step": 32438 }, { "epoch": 0.89, "learning_rate": 6.750897651352517e-07, "loss": 1.3171, "step": 32439 }, { "epoch": 0.89, "learning_rate": 6.747703236733271e-07, "loss": 1.2144, "step": 32440 }, { "epoch": 0.89, "learning_rate": 6.744509551676159e-07, "loss": 1.2761, "step": 32441 }, { "epoch": 0.89, "learning_rate": 6.741316596206149e-07, "loss": 1.1692, "step": 32442 }, { "epoch": 0.89, "learning_rate": 6.738124370348242e-07, "loss": 1.127, "step": 32443 }, { "epoch": 0.89, "learning_rate": 6.734932874127375e-07, "loss": 1.2888, "step": 32444 }, { "epoch": 0.89, "learning_rate": 6.731742107568529e-07, "loss": 1.3794, "step": 32445 }, { "epoch": 0.89, "learning_rate": 6.728552070696692e-07, "loss": 1.3027, "step": 32446 }, { "epoch": 0.89, "learning_rate": 6.725362763536802e-07, "loss": 1.2654, "step": 32447 }, { "epoch": 0.89, "learning_rate": 6.722174186113817e-07, "loss": 1.2534, "step": 32448 }, { "epoch": 0.89, "learning_rate": 6.71898633845266e-07, "loss": 1.2229, "step": 32449 }, { "epoch": 0.89, "learning_rate": 6.715799220578311e-07, "loss": 1.2605, "step": 32450 }, { "epoch": 0.89, "learning_rate": 6.712612832515686e-07, "loss": 1.2458, "step": 32451 }, { "epoch": 0.89, "learning_rate": 6.709427174289695e-07, "loss": 1.3401, "step": 32452 }, { "epoch": 0.89, "learning_rate": 6.706242245925276e-07, "loss": 1.26, "step": 32453 }, { "epoch": 0.89, "learning_rate": 6.703058047447364e-07, "loss": 1.2341, "step": 32454 }, { "epoch": 0.89, "learning_rate": 6.699874578880849e-07, "loss": 1.2771, "step": 32455 }, { "epoch": 0.89, "learning_rate": 6.696691840250646e-07, "loss": 1.27, "step": 32456 }, { "epoch": 0.89, "learning_rate": 6.693509831581635e-07, "loss": 1.6743, "step": 32457 }, { "epoch": 0.89, "learning_rate": 6.69032855289874e-07, "loss": 1.2566, "step": 32458 }, { "epoch": 0.89, "learning_rate": 6.68714800422684e-07, "loss": 1.1415, "step": 32459 }, { "epoch": 0.89, "learning_rate": 6.683968185590817e-07, "loss": 1.3494, "step": 32460 }, { "epoch": 0.89, "learning_rate": 6.680789097015528e-07, "loss": 1.2751, "step": 32461 }, { "epoch": 0.89, "learning_rate": 6.677610738525875e-07, "loss": 1.1709, "step": 32462 }, { "epoch": 0.89, "learning_rate": 6.674433110146716e-07, "loss": 1.2961, "step": 32463 }, { "epoch": 0.89, "learning_rate": 6.671256211902899e-07, "loss": 1.2651, "step": 32464 }, { "epoch": 0.89, "learning_rate": 6.668080043819292e-07, "loss": 1.2402, "step": 32465 }, { "epoch": 0.89, "learning_rate": 6.664904605920752e-07, "loss": 1.3289, "step": 32466 }, { "epoch": 0.89, "learning_rate": 6.661729898232094e-07, "loss": 1.1951, "step": 32467 }, { "epoch": 0.89, "learning_rate": 6.658555920778165e-07, "loss": 1.3223, "step": 32468 }, { "epoch": 0.89, "learning_rate": 6.65538267358381e-07, "loss": 1.234, "step": 32469 }, { "epoch": 0.89, "learning_rate": 6.652210156673855e-07, "loss": 1.2202, "step": 32470 }, { "epoch": 0.89, "learning_rate": 6.649038370073113e-07, "loss": 1.166, "step": 32471 }, { "epoch": 0.89, "learning_rate": 6.645867313806375e-07, "loss": 1.4019, "step": 32472 }, { "epoch": 0.89, "learning_rate": 6.642696987898489e-07, "loss": 1.2861, "step": 32473 }, { "epoch": 0.89, "learning_rate": 6.639527392374245e-07, "loss": 1.1746, "step": 32474 }, { "epoch": 0.89, "learning_rate": 6.636358527258447e-07, "loss": 1.2048, "step": 32475 }, { "epoch": 0.89, "learning_rate": 6.63319039257585e-07, "loss": 1.2688, "step": 32476 }, { "epoch": 0.89, "learning_rate": 6.63002298835127e-07, "loss": 1.1975, "step": 32477 }, { "epoch": 0.89, "learning_rate": 6.626856314609509e-07, "loss": 1.2683, "step": 32478 }, { "epoch": 0.89, "learning_rate": 6.623690371375291e-07, "loss": 1.1099, "step": 32479 }, { "epoch": 0.89, "learning_rate": 6.62052515867343e-07, "loss": 1.3853, "step": 32480 }, { "epoch": 0.89, "learning_rate": 6.617360676528651e-07, "loss": 1.1343, "step": 32481 }, { "epoch": 0.89, "learning_rate": 6.614196924965766e-07, "loss": 1.2369, "step": 32482 }, { "epoch": 0.89, "learning_rate": 6.611033904009456e-07, "loss": 1.269, "step": 32483 }, { "epoch": 0.89, "learning_rate": 6.607871613684525e-07, "loss": 1.1379, "step": 32484 }, { "epoch": 0.89, "learning_rate": 6.604710054015662e-07, "loss": 1.3213, "step": 32485 }, { "epoch": 0.89, "learning_rate": 6.60154922502767e-07, "loss": 1.1577, "step": 32486 }, { "epoch": 0.89, "learning_rate": 6.598389126745209e-07, "loss": 1.3848, "step": 32487 }, { "epoch": 0.89, "learning_rate": 6.595229759193034e-07, "loss": 1.2783, "step": 32488 }, { "epoch": 0.89, "learning_rate": 6.592071122395849e-07, "loss": 1.1445, "step": 32489 }, { "epoch": 0.89, "learning_rate": 6.588913216378412e-07, "loss": 1.1802, "step": 32490 }, { "epoch": 0.89, "learning_rate": 6.585756041165359e-07, "loss": 1.2374, "step": 32491 }, { "epoch": 0.89, "learning_rate": 6.582599596781424e-07, "loss": 1.2417, "step": 32492 }, { "epoch": 0.89, "learning_rate": 6.579443883251324e-07, "loss": 1.3252, "step": 32493 }, { "epoch": 0.89, "learning_rate": 6.576288900599715e-07, "loss": 1.105, "step": 32494 }, { "epoch": 0.89, "learning_rate": 6.573134648851298e-07, "loss": 1.3486, "step": 32495 }, { "epoch": 0.89, "learning_rate": 6.569981128030722e-07, "loss": 1.1765, "step": 32496 }, { "epoch": 0.89, "learning_rate": 6.566828338162701e-07, "loss": 1.1057, "step": 32497 }, { "epoch": 0.89, "learning_rate": 6.56367627927188e-07, "loss": 1.1667, "step": 32498 }, { "epoch": 0.89, "learning_rate": 6.560524951382918e-07, "loss": 1.0901, "step": 32499 }, { "epoch": 0.89, "learning_rate": 6.557374354520452e-07, "loss": 1.3013, "step": 32500 }, { "epoch": 0.89, "learning_rate": 6.55422448870916e-07, "loss": 1.157, "step": 32501 }, { "epoch": 0.89, "learning_rate": 6.551075353973679e-07, "loss": 1.384, "step": 32502 }, { "epoch": 0.89, "learning_rate": 6.547926950338645e-07, "loss": 1.2327, "step": 32503 }, { "epoch": 0.89, "learning_rate": 6.544779277828673e-07, "loss": 1.0898, "step": 32504 }, { "epoch": 0.89, "learning_rate": 6.541632336468417e-07, "loss": 1.3455, "step": 32505 }, { "epoch": 0.89, "learning_rate": 6.538486126282472e-07, "loss": 1.2808, "step": 32506 }, { "epoch": 0.89, "learning_rate": 6.535340647295452e-07, "loss": 1.1997, "step": 32507 }, { "epoch": 0.89, "learning_rate": 6.532195899532001e-07, "loss": 1.2542, "step": 32508 }, { "epoch": 0.89, "learning_rate": 6.529051883016691e-07, "loss": 1.3418, "step": 32509 }, { "epoch": 0.89, "learning_rate": 6.525908597774122e-07, "loss": 1.2593, "step": 32510 }, { "epoch": 0.89, "learning_rate": 6.522766043828876e-07, "loss": 1.2637, "step": 32511 }, { "epoch": 0.89, "learning_rate": 6.519624221205567e-07, "loss": 1.2346, "step": 32512 }, { "epoch": 0.89, "learning_rate": 6.516483129928763e-07, "loss": 1.2268, "step": 32513 }, { "epoch": 0.89, "learning_rate": 6.513342770023045e-07, "loss": 1.0886, "step": 32514 }, { "epoch": 0.89, "learning_rate": 6.51020314151295e-07, "loss": 1.2563, "step": 32515 }, { "epoch": 0.89, "learning_rate": 6.507064244423067e-07, "loss": 1.4412, "step": 32516 }, { "epoch": 0.89, "learning_rate": 6.503926078777967e-07, "loss": 1.3105, "step": 32517 }, { "epoch": 0.89, "learning_rate": 6.500788644602174e-07, "loss": 1.3093, "step": 32518 }, { "epoch": 0.89, "learning_rate": 6.497651941920236e-07, "loss": 1.323, "step": 32519 }, { "epoch": 0.89, "learning_rate": 6.494515970756709e-07, "loss": 1.1597, "step": 32520 }, { "epoch": 0.89, "learning_rate": 6.491380731136121e-07, "loss": 1.3259, "step": 32521 }, { "epoch": 0.89, "learning_rate": 6.488246223083006e-07, "loss": 1.1462, "step": 32522 }, { "epoch": 0.89, "learning_rate": 6.485112446621866e-07, "loss": 1.3853, "step": 32523 }, { "epoch": 0.89, "learning_rate": 6.481979401777228e-07, "loss": 1.3159, "step": 32524 }, { "epoch": 0.89, "learning_rate": 6.478847088573637e-07, "loss": 1.2119, "step": 32525 }, { "epoch": 0.89, "learning_rate": 6.47571550703554e-07, "loss": 1.2396, "step": 32526 }, { "epoch": 0.89, "learning_rate": 6.472584657187475e-07, "loss": 1.2539, "step": 32527 }, { "epoch": 0.89, "learning_rate": 6.469454539053921e-07, "loss": 1.2151, "step": 32528 }, { "epoch": 0.89, "learning_rate": 6.466325152659403e-07, "loss": 1.4111, "step": 32529 }, { "epoch": 0.89, "learning_rate": 6.463196498028345e-07, "loss": 1.3652, "step": 32530 }, { "epoch": 0.89, "learning_rate": 6.460068575185263e-07, "loss": 1.3435, "step": 32531 }, { "epoch": 0.89, "learning_rate": 6.456941384154613e-07, "loss": 1.1624, "step": 32532 }, { "epoch": 0.89, "learning_rate": 6.453814924960889e-07, "loss": 1.3313, "step": 32533 }, { "epoch": 0.89, "learning_rate": 6.450689197628501e-07, "loss": 1.2573, "step": 32534 }, { "epoch": 0.89, "learning_rate": 6.447564202181955e-07, "loss": 1.2495, "step": 32535 }, { "epoch": 0.89, "learning_rate": 6.444439938645641e-07, "loss": 1.7026, "step": 32536 }, { "epoch": 0.89, "learning_rate": 6.441316407044085e-07, "loss": 1.3132, "step": 32537 }, { "epoch": 0.89, "learning_rate": 6.438193607401632e-07, "loss": 1.2773, "step": 32538 }, { "epoch": 0.89, "learning_rate": 6.435071539742765e-07, "loss": 1.0667, "step": 32539 }, { "epoch": 0.89, "learning_rate": 6.431950204091908e-07, "loss": 1.2876, "step": 32540 }, { "epoch": 0.89, "learning_rate": 6.428829600473474e-07, "loss": 1.1694, "step": 32541 }, { "epoch": 0.89, "learning_rate": 6.425709728911888e-07, "loss": 1.1111, "step": 32542 }, { "epoch": 0.89, "learning_rate": 6.422590589431521e-07, "loss": 1.1609, "step": 32543 }, { "epoch": 0.89, "learning_rate": 6.419472182056819e-07, "loss": 1.2681, "step": 32544 }, { "epoch": 0.89, "learning_rate": 6.416354506812162e-07, "loss": 1.3589, "step": 32545 }, { "epoch": 0.89, "learning_rate": 6.413237563721941e-07, "loss": 1.2087, "step": 32546 }, { "epoch": 0.89, "learning_rate": 6.410121352810528e-07, "loss": 1.1726, "step": 32547 }, { "epoch": 0.89, "learning_rate": 6.407005874102335e-07, "loss": 1.3767, "step": 32548 }, { "epoch": 0.89, "learning_rate": 6.403891127621719e-07, "loss": 1.1301, "step": 32549 }, { "epoch": 0.89, "learning_rate": 6.400777113393042e-07, "loss": 1.1943, "step": 32550 }, { "epoch": 0.89, "learning_rate": 6.397663831440659e-07, "loss": 1.3022, "step": 32551 }, { "epoch": 0.89, "learning_rate": 6.394551281788952e-07, "loss": 1.1851, "step": 32552 }, { "epoch": 0.89, "learning_rate": 6.391439464462257e-07, "loss": 1.1641, "step": 32553 }, { "epoch": 0.89, "learning_rate": 6.388328379484909e-07, "loss": 1.2996, "step": 32554 }, { "epoch": 0.89, "learning_rate": 6.385218026881279e-07, "loss": 1.1458, "step": 32555 }, { "epoch": 0.89, "learning_rate": 6.38210840667568e-07, "loss": 1.134, "step": 32556 }, { "epoch": 0.89, "learning_rate": 6.378999518892437e-07, "loss": 1.3027, "step": 32557 }, { "epoch": 0.89, "learning_rate": 6.375891363555864e-07, "loss": 1.1443, "step": 32558 }, { "epoch": 0.89, "learning_rate": 6.372783940690319e-07, "loss": 1.2224, "step": 32559 }, { "epoch": 0.89, "learning_rate": 6.369677250320072e-07, "loss": 1.6196, "step": 32560 }, { "epoch": 0.89, "learning_rate": 6.366571292469448e-07, "loss": 1.1812, "step": 32561 }, { "epoch": 0.89, "learning_rate": 6.363466067162727e-07, "loss": 1.2295, "step": 32562 }, { "epoch": 0.89, "learning_rate": 6.360361574424234e-07, "loss": 1.2581, "step": 32563 }, { "epoch": 0.89, "learning_rate": 6.357257814278228e-07, "loss": 1.2678, "step": 32564 }, { "epoch": 0.89, "learning_rate": 6.354154786749012e-07, "loss": 1.325, "step": 32565 }, { "epoch": 0.89, "learning_rate": 6.351052491860843e-07, "loss": 1.1392, "step": 32566 }, { "epoch": 0.89, "learning_rate": 6.347950929638003e-07, "loss": 1.2454, "step": 32567 }, { "epoch": 0.89, "learning_rate": 6.344850100104771e-07, "loss": 1.231, "step": 32568 }, { "epoch": 0.89, "learning_rate": 6.341750003285375e-07, "loss": 1.2969, "step": 32569 }, { "epoch": 0.89, "learning_rate": 6.338650639204092e-07, "loss": 1.4292, "step": 32570 }, { "epoch": 0.89, "learning_rate": 6.335552007885148e-07, "loss": 1.4204, "step": 32571 }, { "epoch": 0.89, "learning_rate": 6.332454109352837e-07, "loss": 1.2715, "step": 32572 }, { "epoch": 0.89, "learning_rate": 6.329356943631337e-07, "loss": 1.2039, "step": 32573 }, { "epoch": 0.89, "learning_rate": 6.326260510744909e-07, "loss": 1.2499, "step": 32574 }, { "epoch": 0.89, "learning_rate": 6.323164810717753e-07, "loss": 1.2722, "step": 32575 }, { "epoch": 0.89, "learning_rate": 6.320069843574139e-07, "loss": 1.2681, "step": 32576 }, { "epoch": 0.89, "learning_rate": 6.316975609338216e-07, "loss": 1.3076, "step": 32577 }, { "epoch": 0.89, "learning_rate": 6.31388210803423e-07, "loss": 1.6396, "step": 32578 }, { "epoch": 0.89, "learning_rate": 6.310789339686374e-07, "loss": 1.1921, "step": 32579 }, { "epoch": 0.89, "learning_rate": 6.307697304318871e-07, "loss": 1.3669, "step": 32580 }, { "epoch": 0.89, "learning_rate": 6.304606001955848e-07, "loss": 1.1528, "step": 32581 }, { "epoch": 0.89, "learning_rate": 6.301515432621564e-07, "loss": 1.3115, "step": 32582 }, { "epoch": 0.89, "learning_rate": 6.29842559634013e-07, "loss": 1.2727, "step": 32583 }, { "epoch": 0.89, "learning_rate": 6.295336493135795e-07, "loss": 1.2712, "step": 32584 }, { "epoch": 0.89, "learning_rate": 6.29224812303264e-07, "loss": 1.2891, "step": 32585 }, { "epoch": 0.89, "learning_rate": 6.28916048605488e-07, "loss": 1.3672, "step": 32586 }, { "epoch": 0.89, "learning_rate": 6.286073582226681e-07, "loss": 1.2043, "step": 32587 }, { "epoch": 0.89, "learning_rate": 6.282987411572172e-07, "loss": 1.2947, "step": 32588 }, { "epoch": 0.89, "learning_rate": 6.279901974115499e-07, "loss": 1.2986, "step": 32589 }, { "epoch": 0.89, "learning_rate": 6.276817269880786e-07, "loss": 1.1296, "step": 32590 }, { "epoch": 0.89, "learning_rate": 6.273733298892204e-07, "loss": 1.1487, "step": 32591 }, { "epoch": 0.89, "learning_rate": 6.270650061173855e-07, "loss": 1.1335, "step": 32592 }, { "epoch": 0.89, "learning_rate": 6.267567556749865e-07, "loss": 1.3708, "step": 32593 }, { "epoch": 0.89, "learning_rate": 6.264485785644336e-07, "loss": 1.2017, "step": 32594 }, { "epoch": 0.89, "learning_rate": 6.261404747881417e-07, "loss": 1.3738, "step": 32595 }, { "epoch": 0.89, "learning_rate": 6.258324443485175e-07, "loss": 1.281, "step": 32596 }, { "epoch": 0.89, "learning_rate": 6.255244872479727e-07, "loss": 1.313, "step": 32597 }, { "epoch": 0.89, "learning_rate": 6.252166034889151e-07, "loss": 1.3521, "step": 32598 }, { "epoch": 0.89, "learning_rate": 6.249087930737551e-07, "loss": 1.1172, "step": 32599 }, { "epoch": 0.89, "learning_rate": 6.24601056004901e-07, "loss": 1.1658, "step": 32600 }, { "epoch": 0.89, "learning_rate": 6.242933922847572e-07, "loss": 1.2656, "step": 32601 }, { "epoch": 0.89, "learning_rate": 6.239858019157352e-07, "loss": 1.3726, "step": 32602 }, { "epoch": 0.89, "learning_rate": 6.236782849002387e-07, "loss": 1.3723, "step": 32603 }, { "epoch": 0.89, "learning_rate": 6.233708412406758e-07, "loss": 1.2117, "step": 32604 }, { "epoch": 0.89, "learning_rate": 6.230634709394479e-07, "loss": 1.1692, "step": 32605 }, { "epoch": 0.89, "learning_rate": 6.22756173998963e-07, "loss": 1.2502, "step": 32606 }, { "epoch": 0.89, "learning_rate": 6.224489504216247e-07, "loss": 1.136, "step": 32607 }, { "epoch": 0.89, "learning_rate": 6.221418002098367e-07, "loss": 1.3286, "step": 32608 }, { "epoch": 0.89, "learning_rate": 6.218347233659993e-07, "loss": 1.4023, "step": 32609 }, { "epoch": 0.89, "learning_rate": 6.215277198925185e-07, "loss": 1.141, "step": 32610 }, { "epoch": 0.89, "learning_rate": 6.212207897917955e-07, "loss": 1.2646, "step": 32611 }, { "epoch": 0.89, "learning_rate": 6.209139330662295e-07, "loss": 1.0928, "step": 32612 }, { "epoch": 0.89, "learning_rate": 6.20607149718222e-07, "loss": 1.0702, "step": 32613 }, { "epoch": 0.89, "learning_rate": 6.203004397501755e-07, "loss": 1.376, "step": 32614 }, { "epoch": 0.89, "learning_rate": 6.19993803164487e-07, "loss": 1.2444, "step": 32615 }, { "epoch": 0.89, "learning_rate": 6.196872399635556e-07, "loss": 1.1902, "step": 32616 }, { "epoch": 0.89, "learning_rate": 6.193807501497806e-07, "loss": 1.2356, "step": 32617 }, { "epoch": 0.89, "learning_rate": 6.190743337255589e-07, "loss": 1.3342, "step": 32618 }, { "epoch": 0.89, "learning_rate": 6.187679906932909e-07, "loss": 1.282, "step": 32619 }, { "epoch": 0.89, "learning_rate": 6.184617210553678e-07, "loss": 1.5391, "step": 32620 }, { "epoch": 0.89, "learning_rate": 6.181555248141902e-07, "loss": 1.2225, "step": 32621 }, { "epoch": 0.89, "learning_rate": 6.178494019721515e-07, "loss": 1.2135, "step": 32622 }, { "epoch": 0.89, "learning_rate": 6.175433525316477e-07, "loss": 1.1953, "step": 32623 }, { "epoch": 0.89, "learning_rate": 6.172373764950734e-07, "loss": 1.3406, "step": 32624 }, { "epoch": 0.89, "learning_rate": 6.169314738648213e-07, "loss": 1.3635, "step": 32625 }, { "epoch": 0.89, "learning_rate": 6.166256446432838e-07, "loss": 1.1807, "step": 32626 }, { "epoch": 0.89, "learning_rate": 6.16319888832857e-07, "loss": 1.2441, "step": 32627 }, { "epoch": 0.89, "learning_rate": 6.160142064359298e-07, "loss": 1.2102, "step": 32628 }, { "epoch": 0.89, "learning_rate": 6.157085974548949e-07, "loss": 1.2925, "step": 32629 }, { "epoch": 0.89, "learning_rate": 6.154030618921425e-07, "loss": 1.2644, "step": 32630 }, { "epoch": 0.89, "learning_rate": 6.150975997500641e-07, "loss": 1.333, "step": 32631 }, { "epoch": 0.89, "learning_rate": 6.1479221103105e-07, "loss": 1.0662, "step": 32632 }, { "epoch": 0.89, "learning_rate": 6.144868957374861e-07, "loss": 1.3645, "step": 32633 }, { "epoch": 0.89, "learning_rate": 6.14181653871766e-07, "loss": 1.2197, "step": 32634 }, { "epoch": 0.89, "learning_rate": 6.138764854362733e-07, "loss": 1.2729, "step": 32635 }, { "epoch": 0.89, "learning_rate": 6.135713904333984e-07, "loss": 1.2979, "step": 32636 }, { "epoch": 0.89, "learning_rate": 6.13266368865526e-07, "loss": 1.3142, "step": 32637 }, { "epoch": 0.89, "learning_rate": 6.129614207350443e-07, "loss": 1.0179, "step": 32638 }, { "epoch": 0.89, "learning_rate": 6.12656546044339e-07, "loss": 1.2527, "step": 32639 }, { "epoch": 0.89, "learning_rate": 6.123517447957938e-07, "loss": 1.2979, "step": 32640 }, { "epoch": 0.89, "learning_rate": 6.120470169917936e-07, "loss": 1.3193, "step": 32641 }, { "epoch": 0.89, "learning_rate": 6.117423626347241e-07, "loss": 1.1436, "step": 32642 }, { "epoch": 0.89, "learning_rate": 6.114377817269679e-07, "loss": 1.4429, "step": 32643 }, { "epoch": 0.89, "learning_rate": 6.111332742709076e-07, "loss": 1.4736, "step": 32644 }, { "epoch": 0.89, "learning_rate": 6.108288402689233e-07, "loss": 1.2971, "step": 32645 }, { "epoch": 0.89, "learning_rate": 6.105244797234012e-07, "loss": 1.2417, "step": 32646 }, { "epoch": 0.89, "learning_rate": 6.102201926367201e-07, "loss": 1.3191, "step": 32647 }, { "epoch": 0.89, "learning_rate": 6.099159790112596e-07, "loss": 1.2454, "step": 32648 }, { "epoch": 0.89, "learning_rate": 6.096118388494033e-07, "loss": 1.0891, "step": 32649 }, { "epoch": 0.89, "learning_rate": 6.093077721535268e-07, "loss": 1.1719, "step": 32650 }, { "epoch": 0.89, "learning_rate": 6.090037789260106e-07, "loss": 1.2546, "step": 32651 }, { "epoch": 0.89, "learning_rate": 6.086998591692329e-07, "loss": 1.2021, "step": 32652 }, { "epoch": 0.89, "learning_rate": 6.083960128855715e-07, "loss": 1.1824, "step": 32653 }, { "epoch": 0.89, "learning_rate": 6.080922400774036e-07, "loss": 1.1338, "step": 32654 }, { "epoch": 0.89, "learning_rate": 6.077885407471062e-07, "loss": 1.7437, "step": 32655 }, { "epoch": 0.89, "learning_rate": 6.07484914897053e-07, "loss": 1.3862, "step": 32656 }, { "epoch": 0.89, "learning_rate": 6.071813625296219e-07, "loss": 1.3108, "step": 32657 }, { "epoch": 0.89, "learning_rate": 6.068778836471867e-07, "loss": 1.1973, "step": 32658 }, { "epoch": 0.89, "learning_rate": 6.065744782521243e-07, "loss": 1.2561, "step": 32659 }, { "epoch": 0.89, "learning_rate": 6.06271146346803e-07, "loss": 1.3333, "step": 32660 }, { "epoch": 0.89, "learning_rate": 6.059678879336006e-07, "loss": 1.3535, "step": 32661 }, { "epoch": 0.89, "learning_rate": 6.056647030148865e-07, "loss": 1.2771, "step": 32662 }, { "epoch": 0.89, "learning_rate": 6.053615915930366e-07, "loss": 1.3276, "step": 32663 }, { "epoch": 0.89, "learning_rate": 6.05058553670419e-07, "loss": 1.4263, "step": 32664 }, { "epoch": 0.89, "learning_rate": 6.047555892494039e-07, "loss": 1.2847, "step": 32665 }, { "epoch": 0.89, "learning_rate": 6.044526983323651e-07, "loss": 1.2644, "step": 32666 }, { "epoch": 0.89, "learning_rate": 6.041498809216706e-07, "loss": 1.1384, "step": 32667 }, { "epoch": 0.89, "learning_rate": 6.038471370196886e-07, "loss": 1.2959, "step": 32668 }, { "epoch": 0.89, "learning_rate": 6.03544466628786e-07, "loss": 1.2539, "step": 32669 }, { "epoch": 0.89, "learning_rate": 6.032418697513353e-07, "loss": 1.3245, "step": 32670 }, { "epoch": 0.89, "learning_rate": 6.029393463897015e-07, "loss": 1.3547, "step": 32671 }, { "epoch": 0.89, "learning_rate": 6.026368965462514e-07, "loss": 1.178, "step": 32672 }, { "epoch": 0.89, "learning_rate": 6.023345202233499e-07, "loss": 1.2551, "step": 32673 }, { "epoch": 0.89, "learning_rate": 6.020322174233661e-07, "loss": 1.1082, "step": 32674 }, { "epoch": 0.89, "learning_rate": 6.017299881486627e-07, "loss": 1.2844, "step": 32675 }, { "epoch": 0.89, "learning_rate": 6.014278324016032e-07, "loss": 1.4612, "step": 32676 }, { "epoch": 0.89, "learning_rate": 6.011257501845525e-07, "loss": 1.0359, "step": 32677 }, { "epoch": 0.89, "learning_rate": 6.008237414998764e-07, "loss": 1.249, "step": 32678 }, { "epoch": 0.89, "learning_rate": 6.005218063499341e-07, "loss": 1.3108, "step": 32679 }, { "epoch": 0.89, "learning_rate": 6.002199447370882e-07, "loss": 1.2356, "step": 32680 }, { "epoch": 0.89, "learning_rate": 5.999181566637035e-07, "loss": 1.2529, "step": 32681 }, { "epoch": 0.89, "learning_rate": 5.996164421321382e-07, "loss": 1.2544, "step": 32682 }, { "epoch": 0.89, "learning_rate": 5.993148011447536e-07, "loss": 1.2583, "step": 32683 }, { "epoch": 0.89, "learning_rate": 5.990132337039078e-07, "loss": 1.2866, "step": 32684 }, { "epoch": 0.89, "learning_rate": 5.987117398119636e-07, "loss": 1.1318, "step": 32685 }, { "epoch": 0.89, "learning_rate": 5.984103194712787e-07, "loss": 1.2183, "step": 32686 }, { "epoch": 0.89, "learning_rate": 5.981089726842093e-07, "loss": 1.1401, "step": 32687 }, { "epoch": 0.89, "learning_rate": 5.978076994531135e-07, "loss": 1.3008, "step": 32688 }, { "epoch": 0.89, "learning_rate": 5.975064997803503e-07, "loss": 1.3254, "step": 32689 }, { "epoch": 0.89, "learning_rate": 5.972053736682748e-07, "loss": 1.1536, "step": 32690 }, { "epoch": 0.89, "learning_rate": 5.969043211192427e-07, "loss": 1.1848, "step": 32691 }, { "epoch": 0.89, "learning_rate": 5.966033421356088e-07, "loss": 1.6294, "step": 32692 }, { "epoch": 0.89, "learning_rate": 5.963024367197279e-07, "loss": 1.2349, "step": 32693 }, { "epoch": 0.89, "learning_rate": 5.960016048739581e-07, "loss": 1.3188, "step": 32694 }, { "epoch": 0.89, "learning_rate": 5.957008466006464e-07, "loss": 1.1912, "step": 32695 }, { "epoch": 0.89, "learning_rate": 5.954001619021499e-07, "loss": 1.2544, "step": 32696 }, { "epoch": 0.89, "learning_rate": 5.950995507808199e-07, "loss": 1.1965, "step": 32697 }, { "epoch": 0.89, "learning_rate": 5.947990132390113e-07, "loss": 1.2649, "step": 32698 }, { "epoch": 0.89, "learning_rate": 5.944985492790689e-07, "loss": 1.1707, "step": 32699 }, { "epoch": 0.89, "learning_rate": 5.941981589033497e-07, "loss": 1.1895, "step": 32700 }, { "epoch": 0.89, "learning_rate": 5.938978421141983e-07, "loss": 1.3076, "step": 32701 }, { "epoch": 0.89, "learning_rate": 5.935975989139709e-07, "loss": 1.3223, "step": 32702 }, { "epoch": 0.89, "learning_rate": 5.932974293050098e-07, "loss": 1.3445, "step": 32703 }, { "epoch": 0.89, "learning_rate": 5.929973332896677e-07, "loss": 1.1929, "step": 32704 }, { "epoch": 0.89, "learning_rate": 5.926973108702893e-07, "loss": 1.3315, "step": 32705 }, { "epoch": 0.89, "learning_rate": 5.923973620492273e-07, "loss": 1.2991, "step": 32706 }, { "epoch": 0.89, "learning_rate": 5.92097486828821e-07, "loss": 1.1226, "step": 32707 }, { "epoch": 0.89, "learning_rate": 5.917976852114204e-07, "loss": 1.1726, "step": 32708 }, { "epoch": 0.89, "learning_rate": 5.914979571993707e-07, "loss": 1.1555, "step": 32709 }, { "epoch": 0.89, "learning_rate": 5.911983027950174e-07, "loss": 1.2095, "step": 32710 }, { "epoch": 0.89, "learning_rate": 5.908987220007056e-07, "loss": 1.3276, "step": 32711 }, { "epoch": 0.89, "learning_rate": 5.905992148187745e-07, "loss": 1.2524, "step": 32712 }, { "epoch": 0.89, "learning_rate": 5.902997812515732e-07, "loss": 1.6543, "step": 32713 }, { "epoch": 0.89, "learning_rate": 5.900004213014409e-07, "loss": 1.2163, "step": 32714 }, { "epoch": 0.89, "learning_rate": 5.897011349707216e-07, "loss": 1.2383, "step": 32715 }, { "epoch": 0.89, "learning_rate": 5.894019222617531e-07, "loss": 1.3293, "step": 32716 }, { "epoch": 0.89, "learning_rate": 5.891027831768803e-07, "loss": 1.1189, "step": 32717 }, { "epoch": 0.89, "learning_rate": 5.888037177184425e-07, "loss": 1.2129, "step": 32718 }, { "epoch": 0.89, "learning_rate": 5.885047258887777e-07, "loss": 1.3218, "step": 32719 }, { "epoch": 0.89, "learning_rate": 5.882058076902264e-07, "loss": 1.3152, "step": 32720 }, { "epoch": 0.89, "learning_rate": 5.879069631251277e-07, "loss": 1.5476, "step": 32721 }, { "epoch": 0.89, "learning_rate": 5.876081921958199e-07, "loss": 1.2322, "step": 32722 }, { "epoch": 0.89, "learning_rate": 5.873094949046387e-07, "loss": 1.3115, "step": 32723 }, { "epoch": 0.89, "learning_rate": 5.870108712539203e-07, "loss": 1.3726, "step": 32724 }, { "epoch": 0.89, "learning_rate": 5.867123212460047e-07, "loss": 1.3022, "step": 32725 }, { "epoch": 0.89, "learning_rate": 5.864138448832246e-07, "loss": 1.2703, "step": 32726 }, { "epoch": 0.89, "learning_rate": 5.86115442167916e-07, "loss": 1.311, "step": 32727 }, { "epoch": 0.89, "learning_rate": 5.858171131024137e-07, "loss": 1.3313, "step": 32728 }, { "epoch": 0.89, "learning_rate": 5.855188576890514e-07, "loss": 1.1711, "step": 32729 }, { "epoch": 0.89, "learning_rate": 5.852206759301638e-07, "loss": 1.7666, "step": 32730 }, { "epoch": 0.89, "learning_rate": 5.849225678280801e-07, "loss": 1.3303, "step": 32731 }, { "epoch": 0.89, "learning_rate": 5.846245333851364e-07, "loss": 1.343, "step": 32732 }, { "epoch": 0.89, "learning_rate": 5.843265726036629e-07, "loss": 1.1631, "step": 32733 }, { "epoch": 0.89, "learning_rate": 5.8402868548599e-07, "loss": 1.1726, "step": 32734 }, { "epoch": 0.89, "learning_rate": 5.837308720344492e-07, "loss": 1.2605, "step": 32735 }, { "epoch": 0.89, "learning_rate": 5.834331322513709e-07, "loss": 1.3616, "step": 32736 }, { "epoch": 0.89, "learning_rate": 5.831354661390831e-07, "loss": 1.2422, "step": 32737 }, { "epoch": 0.89, "learning_rate": 5.828378736999163e-07, "loss": 1.1453, "step": 32738 }, { "epoch": 0.89, "learning_rate": 5.825403549361952e-07, "loss": 1.4517, "step": 32739 }, { "epoch": 0.89, "learning_rate": 5.822429098502514e-07, "loss": 1.2156, "step": 32740 }, { "epoch": 0.89, "learning_rate": 5.819455384444117e-07, "loss": 1.2896, "step": 32741 }, { "epoch": 0.89, "learning_rate": 5.81648240721e-07, "loss": 1.3586, "step": 32742 }, { "epoch": 0.89, "learning_rate": 5.813510166823444e-07, "loss": 1.2666, "step": 32743 }, { "epoch": 0.89, "learning_rate": 5.810538663307686e-07, "loss": 1.2764, "step": 32744 }, { "epoch": 0.89, "learning_rate": 5.807567896686007e-07, "loss": 1.2395, "step": 32745 }, { "epoch": 0.89, "learning_rate": 5.804597866981598e-07, "loss": 1.24, "step": 32746 }, { "epoch": 0.89, "learning_rate": 5.801628574217733e-07, "loss": 1.1619, "step": 32747 }, { "epoch": 0.89, "learning_rate": 5.798660018417612e-07, "loss": 1.0759, "step": 32748 }, { "epoch": 0.89, "learning_rate": 5.795692199604519e-07, "loss": 1.2263, "step": 32749 }, { "epoch": 0.89, "learning_rate": 5.79272511780159e-07, "loss": 1.3625, "step": 32750 }, { "epoch": 0.89, "learning_rate": 5.789758773032106e-07, "loss": 1.1975, "step": 32751 }, { "epoch": 0.89, "learning_rate": 5.786793165319227e-07, "loss": 1.1609, "step": 32752 }, { "epoch": 0.89, "learning_rate": 5.783828294686211e-07, "loss": 1.3928, "step": 32753 }, { "epoch": 0.89, "learning_rate": 5.780864161156186e-07, "loss": 1.1133, "step": 32754 }, { "epoch": 0.89, "learning_rate": 5.777900764752376e-07, "loss": 1.3293, "step": 32755 }, { "epoch": 0.89, "learning_rate": 5.774938105497974e-07, "loss": 1.2048, "step": 32756 }, { "epoch": 0.89, "learning_rate": 5.771976183416161e-07, "loss": 1.2688, "step": 32757 }, { "epoch": 0.89, "learning_rate": 5.769014998530087e-07, "loss": 1.1582, "step": 32758 }, { "epoch": 0.89, "learning_rate": 5.76605455086291e-07, "loss": 1.249, "step": 32759 }, { "epoch": 0.89, "learning_rate": 5.763094840437833e-07, "loss": 0.9781, "step": 32760 }, { "epoch": 0.89, "learning_rate": 5.760135867277994e-07, "loss": 1.2075, "step": 32761 }, { "epoch": 0.89, "learning_rate": 5.75717763140653e-07, "loss": 1.2139, "step": 32762 }, { "epoch": 0.89, "learning_rate": 5.754220132846578e-07, "loss": 1.1663, "step": 32763 }, { "epoch": 0.89, "learning_rate": 5.751263371621297e-07, "loss": 1.2659, "step": 32764 }, { "epoch": 0.89, "learning_rate": 5.748307347753823e-07, "loss": 1.2642, "step": 32765 }, { "epoch": 0.89, "learning_rate": 5.745352061267273e-07, "loss": 1.3706, "step": 32766 }, { "epoch": 0.89, "learning_rate": 5.742397512184749e-07, "loss": 1.3215, "step": 32767 }, { "epoch": 0.89, "learning_rate": 5.73944370052939e-07, "loss": 1.2686, "step": 32768 }, { "epoch": 0.89, "learning_rate": 5.736490626324309e-07, "loss": 1.1694, "step": 32769 }, { "epoch": 0.89, "learning_rate": 5.733538289592599e-07, "loss": 1.2058, "step": 32770 }, { "epoch": 0.89, "learning_rate": 5.730586690357343e-07, "loss": 1.2034, "step": 32771 }, { "epoch": 0.89, "learning_rate": 5.727635828641665e-07, "loss": 1.2417, "step": 32772 }, { "epoch": 0.9, "learning_rate": 5.724685704468624e-07, "loss": 1.7793, "step": 32773 }, { "epoch": 0.9, "learning_rate": 5.721736317861304e-07, "loss": 1.167, "step": 32774 }, { "epoch": 0.9, "learning_rate": 5.718787668842807e-07, "loss": 1.3457, "step": 32775 }, { "epoch": 0.9, "learning_rate": 5.715839757436171e-07, "loss": 1.3606, "step": 32776 }, { "epoch": 0.9, "learning_rate": 5.712892583664476e-07, "loss": 1.2441, "step": 32777 }, { "epoch": 0.9, "learning_rate": 5.709946147550749e-07, "loss": 1.2593, "step": 32778 }, { "epoch": 0.9, "learning_rate": 5.707000449118083e-07, "loss": 1.1443, "step": 32779 }, { "epoch": 0.9, "learning_rate": 5.704055488389515e-07, "loss": 1.2917, "step": 32780 }, { "epoch": 0.9, "learning_rate": 5.70111126538806e-07, "loss": 1.1018, "step": 32781 }, { "epoch": 0.9, "learning_rate": 5.698167780136765e-07, "loss": 1.2397, "step": 32782 }, { "epoch": 0.9, "learning_rate": 5.695225032658669e-07, "loss": 1.3818, "step": 32783 }, { "epoch": 0.9, "learning_rate": 5.692283022976796e-07, "loss": 0.9897, "step": 32784 }, { "epoch": 0.9, "learning_rate": 5.689341751114153e-07, "loss": 1.2397, "step": 32785 }, { "epoch": 0.9, "learning_rate": 5.686401217093728e-07, "loss": 1.3904, "step": 32786 }, { "epoch": 0.9, "learning_rate": 5.683461420938563e-07, "loss": 1.1475, "step": 32787 }, { "epoch": 0.9, "learning_rate": 5.680522362671659e-07, "loss": 1.0924, "step": 32788 }, { "epoch": 0.9, "learning_rate": 5.677584042315975e-07, "loss": 1.436, "step": 32789 }, { "epoch": 0.9, "learning_rate": 5.67464645989454e-07, "loss": 1.2786, "step": 32790 }, { "epoch": 0.9, "learning_rate": 5.671709615430298e-07, "loss": 1.1157, "step": 32791 }, { "epoch": 0.9, "learning_rate": 5.668773508946268e-07, "loss": 1.252, "step": 32792 }, { "epoch": 0.9, "learning_rate": 5.665838140465374e-07, "loss": 1.157, "step": 32793 }, { "epoch": 0.9, "learning_rate": 5.662903510010609e-07, "loss": 1.1499, "step": 32794 }, { "epoch": 0.9, "learning_rate": 5.659969617604922e-07, "loss": 1.4097, "step": 32795 }, { "epoch": 0.9, "learning_rate": 5.657036463271292e-07, "loss": 1.7378, "step": 32796 }, { "epoch": 0.9, "learning_rate": 5.654104047032616e-07, "loss": 1.2693, "step": 32797 }, { "epoch": 0.9, "learning_rate": 5.651172368911884e-07, "loss": 1.3291, "step": 32798 }, { "epoch": 0.9, "learning_rate": 5.648241428931999e-07, "loss": 1.3079, "step": 32799 }, { "epoch": 0.9, "learning_rate": 5.645311227115935e-07, "loss": 1.2913, "step": 32800 }, { "epoch": 0.9, "learning_rate": 5.642381763486559e-07, "loss": 1.1128, "step": 32801 }, { "epoch": 0.9, "learning_rate": 5.639453038066822e-07, "loss": 1.1921, "step": 32802 }, { "epoch": 0.9, "learning_rate": 5.636525050879637e-07, "loss": 1.2546, "step": 32803 }, { "epoch": 0.9, "learning_rate": 5.63359780194791e-07, "loss": 1.4246, "step": 32804 }, { "epoch": 0.9, "learning_rate": 5.630671291294543e-07, "loss": 1.3386, "step": 32805 }, { "epoch": 0.9, "learning_rate": 5.627745518942418e-07, "loss": 1.2847, "step": 32806 }, { "epoch": 0.9, "learning_rate": 5.62482048491444e-07, "loss": 1.1659, "step": 32807 }, { "epoch": 0.9, "learning_rate": 5.621896189233488e-07, "loss": 1.2385, "step": 32808 }, { "epoch": 0.9, "learning_rate": 5.618972631922448e-07, "loss": 1.3142, "step": 32809 }, { "epoch": 0.9, "learning_rate": 5.616049813004166e-07, "loss": 1.2478, "step": 32810 }, { "epoch": 0.9, "learning_rate": 5.613127732501544e-07, "loss": 1.3113, "step": 32811 }, { "epoch": 0.9, "learning_rate": 5.610206390437433e-07, "loss": 1.2209, "step": 32812 }, { "epoch": 0.9, "learning_rate": 5.607285786834671e-07, "loss": 1.2866, "step": 32813 }, { "epoch": 0.9, "learning_rate": 5.604365921716116e-07, "loss": 1.3906, "step": 32814 }, { "epoch": 0.9, "learning_rate": 5.601446795104615e-07, "loss": 1.2019, "step": 32815 }, { "epoch": 0.9, "learning_rate": 5.598528407023007e-07, "loss": 1.2351, "step": 32816 }, { "epoch": 0.9, "learning_rate": 5.59561075749413e-07, "loss": 1.3398, "step": 32817 }, { "epoch": 0.9, "learning_rate": 5.592693846540786e-07, "loss": 1.4146, "step": 32818 }, { "epoch": 0.9, "learning_rate": 5.589777674185826e-07, "loss": 1.2725, "step": 32819 }, { "epoch": 0.9, "learning_rate": 5.586862240452051e-07, "loss": 1.2256, "step": 32820 }, { "epoch": 0.9, "learning_rate": 5.583947545362245e-07, "loss": 1.1251, "step": 32821 }, { "epoch": 0.9, "learning_rate": 5.581033588939266e-07, "loss": 1.142, "step": 32822 }, { "epoch": 0.9, "learning_rate": 5.578120371205875e-07, "loss": 1.3318, "step": 32823 }, { "epoch": 0.9, "learning_rate": 5.575207892184864e-07, "loss": 1.3542, "step": 32824 }, { "epoch": 0.9, "learning_rate": 5.572296151899015e-07, "loss": 1.27, "step": 32825 }, { "epoch": 0.9, "learning_rate": 5.569385150371131e-07, "loss": 1.7166, "step": 32826 }, { "epoch": 0.9, "learning_rate": 5.566474887623974e-07, "loss": 1.0647, "step": 32827 }, { "epoch": 0.9, "learning_rate": 5.563565363680312e-07, "loss": 1.3025, "step": 32828 }, { "epoch": 0.9, "learning_rate": 5.560656578562895e-07, "loss": 1.2666, "step": 32829 }, { "epoch": 0.9, "learning_rate": 5.557748532294505e-07, "loss": 1.1975, "step": 32830 }, { "epoch": 0.9, "learning_rate": 5.554841224897878e-07, "loss": 1.1953, "step": 32831 }, { "epoch": 0.9, "learning_rate": 5.551934656395774e-07, "loss": 1.1586, "step": 32832 }, { "epoch": 0.9, "learning_rate": 5.549028826810888e-07, "loss": 1.2417, "step": 32833 }, { "epoch": 0.9, "learning_rate": 5.546123736165998e-07, "loss": 1.1726, "step": 32834 }, { "epoch": 0.9, "learning_rate": 5.543219384483844e-07, "loss": 1.1648, "step": 32835 }, { "epoch": 0.9, "learning_rate": 5.540315771787108e-07, "loss": 1.3406, "step": 32836 }, { "epoch": 0.9, "learning_rate": 5.537412898098526e-07, "loss": 1.0586, "step": 32837 }, { "epoch": 0.9, "learning_rate": 5.534510763440792e-07, "loss": 1.2356, "step": 32838 }, { "epoch": 0.9, "learning_rate": 5.531609367836655e-07, "loss": 1.285, "step": 32839 }, { "epoch": 0.9, "learning_rate": 5.528708711308762e-07, "loss": 1.4442, "step": 32840 }, { "epoch": 0.9, "learning_rate": 5.525808793879839e-07, "loss": 1.1462, "step": 32841 }, { "epoch": 0.9, "learning_rate": 5.522909615572547e-07, "loss": 1.1958, "step": 32842 }, { "epoch": 0.9, "learning_rate": 5.520011176409612e-07, "loss": 1.2852, "step": 32843 }, { "epoch": 0.9, "learning_rate": 5.517113476413649e-07, "loss": 1.1348, "step": 32844 }, { "epoch": 0.9, "learning_rate": 5.514216515607385e-07, "loss": 1.3494, "step": 32845 }, { "epoch": 0.9, "learning_rate": 5.511320294013433e-07, "loss": 1.1636, "step": 32846 }, { "epoch": 0.9, "learning_rate": 5.508424811654522e-07, "loss": 1.2773, "step": 32847 }, { "epoch": 0.9, "learning_rate": 5.505530068553234e-07, "loss": 1.2117, "step": 32848 }, { "epoch": 0.9, "learning_rate": 5.502636064732236e-07, "loss": 1.2737, "step": 32849 }, { "epoch": 0.9, "learning_rate": 5.499742800214191e-07, "loss": 1.416, "step": 32850 }, { "epoch": 0.9, "learning_rate": 5.496850275021726e-07, "loss": 1.2859, "step": 32851 }, { "epoch": 0.9, "learning_rate": 5.493958489177465e-07, "loss": 1.3599, "step": 32852 }, { "epoch": 0.9, "learning_rate": 5.491067442704023e-07, "loss": 1.3865, "step": 32853 }, { "epoch": 0.9, "learning_rate": 5.488177135624029e-07, "loss": 1.2803, "step": 32854 }, { "epoch": 0.9, "learning_rate": 5.485287567960107e-07, "loss": 1.2134, "step": 32855 }, { "epoch": 0.9, "learning_rate": 5.482398739734851e-07, "loss": 1.0596, "step": 32856 }, { "epoch": 0.9, "learning_rate": 5.479510650970843e-07, "loss": 1.3606, "step": 32857 }, { "epoch": 0.9, "learning_rate": 5.476623301690709e-07, "loss": 1.1414, "step": 32858 }, { "epoch": 0.9, "learning_rate": 5.473736691917031e-07, "loss": 1.3059, "step": 32859 }, { "epoch": 0.9, "learning_rate": 5.470850821672391e-07, "loss": 1.1526, "step": 32860 }, { "epoch": 0.9, "learning_rate": 5.467965690979338e-07, "loss": 1.3577, "step": 32861 }, { "epoch": 0.9, "learning_rate": 5.465081299860497e-07, "loss": 1.2068, "step": 32862 }, { "epoch": 0.9, "learning_rate": 5.462197648338396e-07, "loss": 1.1646, "step": 32863 }, { "epoch": 0.9, "learning_rate": 5.459314736435595e-07, "loss": 1.6577, "step": 32864 }, { "epoch": 0.9, "learning_rate": 5.456432564174674e-07, "loss": 1.1472, "step": 32865 }, { "epoch": 0.9, "learning_rate": 5.453551131578161e-07, "loss": 1.2634, "step": 32866 }, { "epoch": 0.9, "learning_rate": 5.450670438668615e-07, "loss": 1.1826, "step": 32867 }, { "epoch": 0.9, "learning_rate": 5.447790485468551e-07, "loss": 1.3684, "step": 32868 }, { "epoch": 0.9, "learning_rate": 5.44491127200052e-07, "loss": 1.2925, "step": 32869 }, { "epoch": 0.9, "learning_rate": 5.442032798287033e-07, "loss": 1.1538, "step": 32870 }, { "epoch": 0.9, "learning_rate": 5.439155064350631e-07, "loss": 1.2227, "step": 32871 }, { "epoch": 0.9, "learning_rate": 5.436278070213796e-07, "loss": 1.2642, "step": 32872 }, { "epoch": 0.9, "learning_rate": 5.433401815899065e-07, "loss": 1.3164, "step": 32873 }, { "epoch": 0.9, "learning_rate": 5.430526301428929e-07, "loss": 1.2234, "step": 32874 }, { "epoch": 0.9, "learning_rate": 5.427651526825895e-07, "loss": 1.2644, "step": 32875 }, { "epoch": 0.9, "learning_rate": 5.42477749211242e-07, "loss": 1.2283, "step": 32876 }, { "epoch": 0.9, "learning_rate": 5.421904197311034e-07, "loss": 1.3918, "step": 32877 }, { "epoch": 0.9, "learning_rate": 5.419031642444183e-07, "loss": 1.293, "step": 32878 }, { "epoch": 0.9, "learning_rate": 5.416159827534373e-07, "loss": 1.2568, "step": 32879 }, { "epoch": 0.9, "learning_rate": 5.413288752604028e-07, "loss": 1.333, "step": 32880 }, { "epoch": 0.9, "learning_rate": 5.410418417675634e-07, "loss": 1.3638, "step": 32881 }, { "epoch": 0.9, "learning_rate": 5.407548822771669e-07, "loss": 1.1233, "step": 32882 }, { "epoch": 0.9, "learning_rate": 5.404679967914539e-07, "loss": 1.1453, "step": 32883 }, { "epoch": 0.9, "learning_rate": 5.401811853126727e-07, "loss": 1.3228, "step": 32884 }, { "epoch": 0.9, "learning_rate": 5.398944478430646e-07, "loss": 1.2517, "step": 32885 }, { "epoch": 0.9, "learning_rate": 5.396077843848757e-07, "loss": 1.1801, "step": 32886 }, { "epoch": 0.9, "learning_rate": 5.393211949403443e-07, "loss": 1.1719, "step": 32887 }, { "epoch": 0.9, "learning_rate": 5.390346795117174e-07, "loss": 1.2363, "step": 32888 }, { "epoch": 0.9, "learning_rate": 5.387482381012321e-07, "loss": 1.2468, "step": 32889 }, { "epoch": 0.9, "learning_rate": 5.384618707111334e-07, "loss": 1.2419, "step": 32890 }, { "epoch": 0.9, "learning_rate": 5.381755773436592e-07, "loss": 1.1216, "step": 32891 }, { "epoch": 0.9, "learning_rate": 5.378893580010514e-07, "loss": 1.4478, "step": 32892 }, { "epoch": 0.9, "learning_rate": 5.376032126855457e-07, "loss": 1.1873, "step": 32893 }, { "epoch": 0.9, "learning_rate": 5.373171413993838e-07, "loss": 1.1555, "step": 32894 }, { "epoch": 0.9, "learning_rate": 5.37031144144804e-07, "loss": 1.2244, "step": 32895 }, { "epoch": 0.9, "learning_rate": 5.367452209240398e-07, "loss": 1.2488, "step": 32896 }, { "epoch": 0.9, "learning_rate": 5.364593717393341e-07, "loss": 1.283, "step": 32897 }, { "epoch": 0.9, "learning_rate": 5.361735965929193e-07, "loss": 1.2817, "step": 32898 }, { "epoch": 0.9, "learning_rate": 5.358878954870317e-07, "loss": 1.1792, "step": 32899 }, { "epoch": 0.9, "learning_rate": 5.35602268423906e-07, "loss": 1.3401, "step": 32900 }, { "epoch": 0.9, "learning_rate": 5.353167154057792e-07, "loss": 1.2312, "step": 32901 }, { "epoch": 0.9, "learning_rate": 5.350312364348842e-07, "loss": 1.6948, "step": 32902 }, { "epoch": 0.9, "learning_rate": 5.347458315134535e-07, "loss": 1.425, "step": 32903 }, { "epoch": 0.9, "learning_rate": 5.344605006437187e-07, "loss": 1.2712, "step": 32904 }, { "epoch": 0.9, "learning_rate": 5.341752438279157e-07, "loss": 1.2979, "step": 32905 }, { "epoch": 0.9, "learning_rate": 5.338900610682751e-07, "loss": 1.2729, "step": 32906 }, { "epoch": 0.9, "learning_rate": 5.336049523670262e-07, "loss": 1.1837, "step": 32907 }, { "epoch": 0.9, "learning_rate": 5.333199177264004e-07, "loss": 1.269, "step": 32908 }, { "epoch": 0.9, "learning_rate": 5.330349571486293e-07, "loss": 1.293, "step": 32909 }, { "epoch": 0.9, "learning_rate": 5.327500706359401e-07, "loss": 1.2971, "step": 32910 }, { "epoch": 0.9, "learning_rate": 5.32465258190562e-07, "loss": 1.2966, "step": 32911 }, { "epoch": 0.9, "learning_rate": 5.321805198147245e-07, "loss": 1.2437, "step": 32912 }, { "epoch": 0.9, "learning_rate": 5.318958555106557e-07, "loss": 1.1995, "step": 32913 }, { "epoch": 0.9, "learning_rate": 5.316112652805805e-07, "loss": 1.1218, "step": 32914 }, { "epoch": 0.9, "learning_rate": 5.313267491267249e-07, "loss": 1.355, "step": 32915 }, { "epoch": 0.9, "learning_rate": 5.310423070513183e-07, "loss": 1.3201, "step": 32916 }, { "epoch": 0.9, "learning_rate": 5.307579390565842e-07, "loss": 1.6758, "step": 32917 }, { "epoch": 0.9, "learning_rate": 5.304736451447468e-07, "loss": 1.3831, "step": 32918 }, { "epoch": 0.9, "learning_rate": 5.301894253180295e-07, "loss": 1.3718, "step": 32919 }, { "epoch": 0.9, "learning_rate": 5.299052795786586e-07, "loss": 1.2893, "step": 32920 }, { "epoch": 0.9, "learning_rate": 5.296212079288543e-07, "loss": 1.2441, "step": 32921 }, { "epoch": 0.9, "learning_rate": 5.293372103708427e-07, "loss": 1.272, "step": 32922 }, { "epoch": 0.9, "learning_rate": 5.29053286906841e-07, "loss": 1.261, "step": 32923 }, { "epoch": 0.9, "learning_rate": 5.287694375390739e-07, "loss": 1.3625, "step": 32924 }, { "epoch": 0.9, "learning_rate": 5.284856622697599e-07, "loss": 1.2102, "step": 32925 }, { "epoch": 0.9, "learning_rate": 5.282019611011213e-07, "loss": 1.1975, "step": 32926 }, { "epoch": 0.9, "learning_rate": 5.279183340353766e-07, "loss": 1.1536, "step": 32927 }, { "epoch": 0.9, "learning_rate": 5.27634781074744e-07, "loss": 1.178, "step": 32928 }, { "epoch": 0.9, "learning_rate": 5.273513022214438e-07, "loss": 1.2764, "step": 32929 }, { "epoch": 0.9, "learning_rate": 5.270678974776922e-07, "loss": 1.2285, "step": 32930 }, { "epoch": 0.9, "learning_rate": 5.267845668457072e-07, "loss": 1.3142, "step": 32931 }, { "epoch": 0.9, "learning_rate": 5.265013103277039e-07, "loss": 1.2322, "step": 32932 }, { "epoch": 0.9, "learning_rate": 5.262181279259015e-07, "loss": 1.2954, "step": 32933 }, { "epoch": 0.9, "learning_rate": 5.259350196425128e-07, "loss": 1.397, "step": 32934 }, { "epoch": 0.9, "learning_rate": 5.256519854797537e-07, "loss": 1.345, "step": 32935 }, { "epoch": 0.9, "learning_rate": 5.25369025439837e-07, "loss": 1.188, "step": 32936 }, { "epoch": 0.9, "learning_rate": 5.250861395249785e-07, "loss": 1.3962, "step": 32937 }, { "epoch": 0.9, "learning_rate": 5.248033277373909e-07, "loss": 1.0891, "step": 32938 }, { "epoch": 0.9, "learning_rate": 5.245205900792871e-07, "loss": 1.2944, "step": 32939 }, { "epoch": 0.9, "learning_rate": 5.242379265528763e-07, "loss": 1.4258, "step": 32940 }, { "epoch": 0.9, "learning_rate": 5.239553371603745e-07, "loss": 1.1597, "step": 32941 }, { "epoch": 0.9, "learning_rate": 5.236728219039899e-07, "loss": 1.0675, "step": 32942 }, { "epoch": 0.9, "learning_rate": 5.233903807859308e-07, "loss": 1.2654, "step": 32943 }, { "epoch": 0.9, "learning_rate": 5.231080138084111e-07, "loss": 1.1055, "step": 32944 }, { "epoch": 0.9, "learning_rate": 5.228257209736387e-07, "loss": 1.6914, "step": 32945 }, { "epoch": 0.9, "learning_rate": 5.22543502283821e-07, "loss": 1.3181, "step": 32946 }, { "epoch": 0.9, "learning_rate": 5.22261357741164e-07, "loss": 1.2537, "step": 32947 }, { "epoch": 0.9, "learning_rate": 5.21979287347879e-07, "loss": 1.2151, "step": 32948 }, { "epoch": 0.9, "learning_rate": 5.216972911061724e-07, "loss": 1.0034, "step": 32949 }, { "epoch": 0.9, "learning_rate": 5.214153690182478e-07, "loss": 1.2417, "step": 32950 }, { "epoch": 0.9, "learning_rate": 5.211335210863123e-07, "loss": 1.1036, "step": 32951 }, { "epoch": 0.9, "learning_rate": 5.208517473125707e-07, "loss": 1.1158, "step": 32952 }, { "epoch": 0.9, "learning_rate": 5.205700476992282e-07, "loss": 1.2966, "step": 32953 }, { "epoch": 0.9, "learning_rate": 5.202884222484883e-07, "loss": 1.281, "step": 32954 }, { "epoch": 0.9, "learning_rate": 5.200068709625527e-07, "loss": 1.2688, "step": 32955 }, { "epoch": 0.9, "learning_rate": 5.197253938436275e-07, "loss": 1.1001, "step": 32956 }, { "epoch": 0.9, "learning_rate": 5.19443990893912e-07, "loss": 1.1758, "step": 32957 }, { "epoch": 0.9, "learning_rate": 5.191626621156076e-07, "loss": 1.1931, "step": 32958 }, { "epoch": 0.9, "learning_rate": 5.188814075109172e-07, "loss": 1.2659, "step": 32959 }, { "epoch": 0.9, "learning_rate": 5.186002270820389e-07, "loss": 1.2322, "step": 32960 }, { "epoch": 0.9, "learning_rate": 5.183191208311777e-07, "loss": 1.1808, "step": 32961 }, { "epoch": 0.9, "learning_rate": 5.180380887605252e-07, "loss": 1.3301, "step": 32962 }, { "epoch": 0.9, "learning_rate": 5.177571308722861e-07, "loss": 1.3335, "step": 32963 }, { "epoch": 0.9, "learning_rate": 5.174762471686556e-07, "loss": 1.2856, "step": 32964 }, { "epoch": 0.9, "learning_rate": 5.17195437651834e-07, "loss": 1.1152, "step": 32965 }, { "epoch": 0.9, "learning_rate": 5.169147023240128e-07, "loss": 1.2358, "step": 32966 }, { "epoch": 0.9, "learning_rate": 5.166340411873938e-07, "loss": 1.2151, "step": 32967 }, { "epoch": 0.9, "learning_rate": 5.163534542441683e-07, "loss": 1.4893, "step": 32968 }, { "epoch": 0.9, "learning_rate": 5.160729414965381e-07, "loss": 1.166, "step": 32969 }, { "epoch": 0.9, "learning_rate": 5.157925029466904e-07, "loss": 1.2529, "step": 32970 }, { "epoch": 0.9, "learning_rate": 5.155121385968232e-07, "loss": 1.2185, "step": 32971 }, { "epoch": 0.9, "learning_rate": 5.152318484491281e-07, "loss": 1.3633, "step": 32972 }, { "epoch": 0.9, "learning_rate": 5.149516325058001e-07, "loss": 1.1863, "step": 32973 }, { "epoch": 0.9, "learning_rate": 5.146714907690297e-07, "loss": 1.3391, "step": 32974 }, { "epoch": 0.9, "learning_rate": 5.143914232410097e-07, "loss": 1.1785, "step": 32975 }, { "epoch": 0.9, "learning_rate": 5.141114299239302e-07, "loss": 1.1115, "step": 32976 }, { "epoch": 0.9, "learning_rate": 5.138315108199832e-07, "loss": 1.3169, "step": 32977 }, { "epoch": 0.9, "learning_rate": 5.135516659313578e-07, "loss": 1.2551, "step": 32978 }, { "epoch": 0.9, "learning_rate": 5.132718952602422e-07, "loss": 1.3374, "step": 32979 }, { "epoch": 0.9, "learning_rate": 5.129921988088271e-07, "loss": 1.343, "step": 32980 }, { "epoch": 0.9, "learning_rate": 5.127125765793006e-07, "loss": 1.209, "step": 32981 }, { "epoch": 0.9, "learning_rate": 5.124330285738488e-07, "loss": 1.3071, "step": 32982 }, { "epoch": 0.9, "learning_rate": 5.121535547946588e-07, "loss": 1.4041, "step": 32983 }, { "epoch": 0.9, "learning_rate": 5.118741552439188e-07, "loss": 1.0426, "step": 32984 }, { "epoch": 0.9, "learning_rate": 5.115948299238149e-07, "loss": 1.4126, "step": 32985 }, { "epoch": 0.9, "learning_rate": 5.113155788365298e-07, "loss": 1.1597, "step": 32986 }, { "epoch": 0.9, "learning_rate": 5.110364019842495e-07, "loss": 1.772, "step": 32987 }, { "epoch": 0.9, "learning_rate": 5.107572993691589e-07, "loss": 1.231, "step": 32988 }, { "epoch": 0.9, "learning_rate": 5.104782709934419e-07, "loss": 1.2651, "step": 32989 }, { "epoch": 0.9, "learning_rate": 5.101993168592789e-07, "loss": 1.2041, "step": 32990 }, { "epoch": 0.9, "learning_rate": 5.099204369688548e-07, "loss": 1.2371, "step": 32991 }, { "epoch": 0.9, "learning_rate": 5.096416313243512e-07, "loss": 1.0928, "step": 32992 }, { "epoch": 0.9, "learning_rate": 5.093628999279488e-07, "loss": 1.3408, "step": 32993 }, { "epoch": 0.9, "learning_rate": 5.090842427818266e-07, "loss": 1.1072, "step": 32994 }, { "epoch": 0.9, "learning_rate": 5.088056598881686e-07, "loss": 1.6958, "step": 32995 }, { "epoch": 0.9, "learning_rate": 5.085271512491507e-07, "loss": 0.9866, "step": 32996 }, { "epoch": 0.9, "learning_rate": 5.082487168669536e-07, "loss": 1.4087, "step": 32997 }, { "epoch": 0.9, "learning_rate": 5.079703567437544e-07, "loss": 1.5942, "step": 32998 }, { "epoch": 0.9, "learning_rate": 5.076920708817334e-07, "loss": 1.4036, "step": 32999 }, { "epoch": 0.9, "learning_rate": 5.074138592830646e-07, "loss": 1.2725, "step": 33000 }, { "epoch": 0.9, "learning_rate": 5.071357219499273e-07, "loss": 1.3223, "step": 33001 }, { "epoch": 0.9, "learning_rate": 5.068576588844943e-07, "loss": 1.1943, "step": 33002 }, { "epoch": 0.9, "learning_rate": 5.065796700889447e-07, "loss": 1.2207, "step": 33003 }, { "epoch": 0.9, "learning_rate": 5.063017555654503e-07, "loss": 1.7183, "step": 33004 }, { "epoch": 0.9, "learning_rate": 5.060239153161872e-07, "loss": 1.2222, "step": 33005 }, { "epoch": 0.9, "learning_rate": 5.057461493433291e-07, "loss": 1.3311, "step": 33006 }, { "epoch": 0.9, "learning_rate": 5.054684576490476e-07, "loss": 1.7134, "step": 33007 }, { "epoch": 0.9, "learning_rate": 5.051908402355187e-07, "loss": 1.3862, "step": 33008 }, { "epoch": 0.9, "learning_rate": 5.049132971049086e-07, "loss": 1.2634, "step": 33009 }, { "epoch": 0.9, "learning_rate": 5.046358282593944e-07, "loss": 1.3005, "step": 33010 }, { "epoch": 0.9, "learning_rate": 5.04358433701142e-07, "loss": 1.2568, "step": 33011 }, { "epoch": 0.9, "learning_rate": 5.040811134323276e-07, "loss": 1.2773, "step": 33012 }, { "epoch": 0.9, "learning_rate": 5.038038674551138e-07, "loss": 1.3574, "step": 33013 }, { "epoch": 0.9, "learning_rate": 5.035266957716756e-07, "loss": 1.3232, "step": 33014 }, { "epoch": 0.9, "learning_rate": 5.032495983841768e-07, "loss": 1.21, "step": 33015 }, { "epoch": 0.9, "learning_rate": 5.0297257529479e-07, "loss": 1.1252, "step": 33016 }, { "epoch": 0.9, "learning_rate": 5.026956265056781e-07, "loss": 1.3701, "step": 33017 }, { "epoch": 0.9, "learning_rate": 5.024187520190105e-07, "loss": 1.3408, "step": 33018 }, { "epoch": 0.9, "learning_rate": 5.021419518369508e-07, "loss": 1.0918, "step": 33019 }, { "epoch": 0.9, "learning_rate": 5.018652259616686e-07, "loss": 1.0989, "step": 33020 }, { "epoch": 0.9, "learning_rate": 5.015885743953253e-07, "loss": 1.2673, "step": 33021 }, { "epoch": 0.9, "learning_rate": 5.01311997140086e-07, "loss": 1.2793, "step": 33022 }, { "epoch": 0.9, "learning_rate": 5.010354941981166e-07, "loss": 1.3306, "step": 33023 }, { "epoch": 0.9, "learning_rate": 5.007590655715777e-07, "loss": 1.3062, "step": 33024 }, { "epoch": 0.9, "learning_rate": 5.004827112626343e-07, "loss": 1.1575, "step": 33025 }, { "epoch": 0.9, "learning_rate": 5.002064312734456e-07, "loss": 1.2974, "step": 33026 }, { "epoch": 0.9, "learning_rate": 4.999302256061756e-07, "loss": 1.2778, "step": 33027 }, { "epoch": 0.9, "learning_rate": 4.996540942629835e-07, "loss": 1.1636, "step": 33028 }, { "epoch": 0.9, "learning_rate": 4.993780372460311e-07, "loss": 1.239, "step": 33029 }, { "epoch": 0.9, "learning_rate": 4.991020545574765e-07, "loss": 1.0918, "step": 33030 }, { "epoch": 0.9, "learning_rate": 4.988261461994814e-07, "loss": 1.3438, "step": 33031 }, { "epoch": 0.9, "learning_rate": 4.985503121742019e-07, "loss": 1.2578, "step": 33032 }, { "epoch": 0.9, "learning_rate": 4.982745524837973e-07, "loss": 1.468, "step": 33033 }, { "epoch": 0.9, "learning_rate": 4.979988671304226e-07, "loss": 1.3716, "step": 33034 }, { "epoch": 0.9, "learning_rate": 4.977232561162382e-07, "loss": 1.1584, "step": 33035 }, { "epoch": 0.9, "learning_rate": 4.974477194433991e-07, "loss": 1.2297, "step": 33036 }, { "epoch": 0.9, "learning_rate": 4.971722571140592e-07, "loss": 1.3645, "step": 33037 }, { "epoch": 0.9, "learning_rate": 4.968968691303766e-07, "loss": 1.1663, "step": 33038 }, { "epoch": 0.9, "learning_rate": 4.966215554945042e-07, "loss": 1.3943, "step": 33039 }, { "epoch": 0.9, "learning_rate": 4.963463162085957e-07, "loss": 1.137, "step": 33040 }, { "epoch": 0.9, "learning_rate": 4.960711512748029e-07, "loss": 1.0999, "step": 33041 }, { "epoch": 0.9, "learning_rate": 4.957960606952817e-07, "loss": 1.3079, "step": 33042 }, { "epoch": 0.9, "learning_rate": 4.955210444721837e-07, "loss": 1.3813, "step": 33043 }, { "epoch": 0.9, "learning_rate": 4.952461026076594e-07, "loss": 1.1125, "step": 33044 }, { "epoch": 0.9, "learning_rate": 4.949712351038593e-07, "loss": 1.3376, "step": 33045 }, { "epoch": 0.9, "learning_rate": 4.946964419629352e-07, "loss": 1.3408, "step": 33046 }, { "epoch": 0.9, "learning_rate": 4.944217231870363e-07, "loss": 1.2532, "step": 33047 }, { "epoch": 0.9, "learning_rate": 4.941470787783131e-07, "loss": 1.2253, "step": 33048 }, { "epoch": 0.9, "learning_rate": 4.938725087389107e-07, "loss": 1.0107, "step": 33049 }, { "epoch": 0.9, "learning_rate": 4.935980130709805e-07, "loss": 1.2251, "step": 33050 }, { "epoch": 0.9, "learning_rate": 4.93323591776671e-07, "loss": 1.2014, "step": 33051 }, { "epoch": 0.9, "learning_rate": 4.930492448581259e-07, "loss": 1.6758, "step": 33052 }, { "epoch": 0.9, "learning_rate": 4.927749723174935e-07, "loss": 1.1016, "step": 33053 }, { "epoch": 0.9, "learning_rate": 4.925007741569176e-07, "loss": 1.2864, "step": 33054 }, { "epoch": 0.9, "learning_rate": 4.922266503785489e-07, "loss": 1.1833, "step": 33055 }, { "epoch": 0.9, "learning_rate": 4.919526009845243e-07, "loss": 1.2476, "step": 33056 }, { "epoch": 0.9, "learning_rate": 4.916786259769923e-07, "loss": 1.3503, "step": 33057 }, { "epoch": 0.9, "learning_rate": 4.914047253580956e-07, "loss": 1.175, "step": 33058 }, { "epoch": 0.9, "learning_rate": 4.91130899129979e-07, "loss": 1.25, "step": 33059 }, { "epoch": 0.9, "learning_rate": 4.908571472947799e-07, "loss": 1.4199, "step": 33060 }, { "epoch": 0.9, "learning_rate": 4.905834698546452e-07, "loss": 1.2603, "step": 33061 }, { "epoch": 0.9, "learning_rate": 4.903098668117123e-07, "loss": 1.3213, "step": 33062 }, { "epoch": 0.9, "learning_rate": 4.90036338168125e-07, "loss": 1.1716, "step": 33063 }, { "epoch": 0.9, "learning_rate": 4.897628839260193e-07, "loss": 1.2256, "step": 33064 }, { "epoch": 0.9, "learning_rate": 4.894895040875381e-07, "loss": 1.1985, "step": 33065 }, { "epoch": 0.9, "learning_rate": 4.892161986548183e-07, "loss": 1.3098, "step": 33066 }, { "epoch": 0.9, "learning_rate": 4.889429676299995e-07, "loss": 1.3801, "step": 33067 }, { "epoch": 0.9, "learning_rate": 4.886698110152177e-07, "loss": 1.3403, "step": 33068 }, { "epoch": 0.9, "learning_rate": 4.883967288126101e-07, "loss": 1.3086, "step": 33069 }, { "epoch": 0.9, "learning_rate": 4.88123721024315e-07, "loss": 1.2988, "step": 33070 }, { "epoch": 0.9, "learning_rate": 4.878507876524674e-07, "loss": 1.1292, "step": 33071 }, { "epoch": 0.9, "learning_rate": 4.875779286992022e-07, "loss": 1.2732, "step": 33072 }, { "epoch": 0.9, "learning_rate": 4.873051441666532e-07, "loss": 1.3533, "step": 33073 }, { "epoch": 0.9, "learning_rate": 4.870324340569566e-07, "loss": 1.3149, "step": 33074 }, { "epoch": 0.9, "learning_rate": 4.867597983722449e-07, "loss": 1.3181, "step": 33075 }, { "epoch": 0.9, "learning_rate": 4.864872371146512e-07, "loss": 1.1304, "step": 33076 }, { "epoch": 0.9, "learning_rate": 4.862147502863057e-07, "loss": 1.2146, "step": 33077 }, { "epoch": 0.9, "learning_rate": 4.859423378893446e-07, "loss": 1.2561, "step": 33078 }, { "epoch": 0.9, "learning_rate": 4.856699999258962e-07, "loss": 1.0754, "step": 33079 }, { "epoch": 0.9, "learning_rate": 4.853977363980921e-07, "loss": 1.1699, "step": 33080 }, { "epoch": 0.9, "learning_rate": 4.851255473080607e-07, "loss": 1.2708, "step": 33081 }, { "epoch": 0.9, "learning_rate": 4.848534326579335e-07, "loss": 1.1748, "step": 33082 }, { "epoch": 0.9, "learning_rate": 4.8458139244984e-07, "loss": 1.1992, "step": 33083 }, { "epoch": 0.9, "learning_rate": 4.84309426685905e-07, "loss": 1.3132, "step": 33084 }, { "epoch": 0.9, "learning_rate": 4.840375353682602e-07, "loss": 1.2083, "step": 33085 }, { "epoch": 0.9, "learning_rate": 4.837657184990307e-07, "loss": 1.2441, "step": 33086 }, { "epoch": 0.9, "learning_rate": 4.834939760803437e-07, "loss": 1.3003, "step": 33087 }, { "epoch": 0.9, "learning_rate": 4.832223081143228e-07, "loss": 1.1921, "step": 33088 }, { "epoch": 0.9, "learning_rate": 4.829507146030976e-07, "loss": 1.1943, "step": 33089 }, { "epoch": 0.9, "learning_rate": 4.826791955487898e-07, "loss": 1.5269, "step": 33090 }, { "epoch": 0.9, "learning_rate": 4.824077509535252e-07, "loss": 1.2656, "step": 33091 }, { "epoch": 0.9, "learning_rate": 4.821363808194258e-07, "loss": 1.1331, "step": 33092 }, { "epoch": 0.9, "learning_rate": 4.818650851486173e-07, "loss": 1.3203, "step": 33093 }, { "epoch": 0.9, "learning_rate": 4.815938639432194e-07, "loss": 1.3728, "step": 33094 }, { "epoch": 0.9, "learning_rate": 4.81322717205357e-07, "loss": 1.3411, "step": 33095 }, { "epoch": 0.9, "learning_rate": 4.810516449371472e-07, "loss": 1.1628, "step": 33096 }, { "epoch": 0.9, "learning_rate": 4.807806471407128e-07, "loss": 1.2004, "step": 33097 }, { "epoch": 0.9, "learning_rate": 4.805097238181777e-07, "loss": 1.2253, "step": 33098 }, { "epoch": 0.9, "learning_rate": 4.802388749716558e-07, "loss": 1.196, "step": 33099 }, { "epoch": 0.9, "learning_rate": 4.799681006032686e-07, "loss": 1.26, "step": 33100 }, { "epoch": 0.9, "learning_rate": 4.796974007151345e-07, "loss": 1.2776, "step": 33101 }, { "epoch": 0.9, "learning_rate": 4.794267753093729e-07, "loss": 1.2976, "step": 33102 }, { "epoch": 0.9, "learning_rate": 4.791562243880965e-07, "loss": 1.1938, "step": 33103 }, { "epoch": 0.9, "learning_rate": 4.78885747953427e-07, "loss": 1.2856, "step": 33104 }, { "epoch": 0.9, "learning_rate": 4.786153460074761e-07, "loss": 1.4067, "step": 33105 }, { "epoch": 0.9, "learning_rate": 4.783450185523641e-07, "loss": 1.094, "step": 33106 }, { "epoch": 0.9, "learning_rate": 4.780747655902007e-07, "loss": 1.2058, "step": 33107 }, { "epoch": 0.9, "learning_rate": 4.778045871231051e-07, "loss": 1.3184, "step": 33108 }, { "epoch": 0.9, "learning_rate": 4.77534483153187e-07, "loss": 1.1238, "step": 33109 }, { "epoch": 0.9, "learning_rate": 4.772644536825633e-07, "loss": 1.2859, "step": 33110 }, { "epoch": 0.9, "learning_rate": 4.769944987133423e-07, "loss": 1.1082, "step": 33111 }, { "epoch": 0.9, "learning_rate": 4.7672461824763815e-07, "loss": 1.1611, "step": 33112 }, { "epoch": 0.9, "learning_rate": 4.764548122875645e-07, "loss": 1.1106, "step": 33113 }, { "epoch": 0.9, "learning_rate": 4.761850808352286e-07, "loss": 1.3733, "step": 33114 }, { "epoch": 0.9, "learning_rate": 4.7591542389274325e-07, "loss": 1.2996, "step": 33115 }, { "epoch": 0.9, "learning_rate": 4.756458414622167e-07, "loss": 1.3376, "step": 33116 }, { "epoch": 0.9, "learning_rate": 4.753763335457584e-07, "loss": 1.1252, "step": 33117 }, { "epoch": 0.9, "learning_rate": 4.751069001454767e-07, "loss": 1.344, "step": 33118 }, { "epoch": 0.9, "learning_rate": 4.7483754126348094e-07, "loss": 1.0547, "step": 33119 }, { "epoch": 0.9, "learning_rate": 4.74568256901875e-07, "loss": 1.2422, "step": 33120 }, { "epoch": 0.9, "learning_rate": 4.742990470627695e-07, "loss": 1.2656, "step": 33121 }, { "epoch": 0.9, "learning_rate": 4.740299117482683e-07, "loss": 1.166, "step": 33122 }, { "epoch": 0.9, "learning_rate": 4.7376085096047855e-07, "loss": 1.2087, "step": 33123 }, { "epoch": 0.9, "learning_rate": 4.7349186470150186e-07, "loss": 1.1305, "step": 33124 }, { "epoch": 0.9, "learning_rate": 4.7322295297344776e-07, "loss": 1.2485, "step": 33125 }, { "epoch": 0.9, "learning_rate": 4.729541157784168e-07, "loss": 1.3069, "step": 33126 }, { "epoch": 0.9, "learning_rate": 4.7268535311851273e-07, "loss": 1.1399, "step": 33127 }, { "epoch": 0.9, "learning_rate": 4.7241666499583727e-07, "loss": 1.2083, "step": 33128 }, { "epoch": 0.9, "learning_rate": 4.7214805141249544e-07, "loss": 1.3347, "step": 33129 }, { "epoch": 0.9, "learning_rate": 4.718795123705866e-07, "loss": 1.365, "step": 33130 }, { "epoch": 0.9, "learning_rate": 4.716110478722102e-07, "loss": 1.333, "step": 33131 }, { "epoch": 0.9, "learning_rate": 4.713426579194702e-07, "loss": 1.3784, "step": 33132 }, { "epoch": 0.9, "learning_rate": 4.710743425144648e-07, "loss": 1.22, "step": 33133 }, { "epoch": 0.9, "learning_rate": 4.708061016592924e-07, "loss": 1.2136, "step": 33134 }, { "epoch": 0.9, "learning_rate": 4.705379353560513e-07, "loss": 1.1536, "step": 33135 }, { "epoch": 0.9, "learning_rate": 4.7026984360684204e-07, "loss": 1.4141, "step": 33136 }, { "epoch": 0.9, "learning_rate": 4.7000182641375956e-07, "loss": 1.1816, "step": 33137 }, { "epoch": 0.9, "learning_rate": 4.697338837789012e-07, "loss": 1.1956, "step": 33138 }, { "epoch": 0.91, "learning_rate": 4.694660157043629e-07, "loss": 1.1931, "step": 33139 }, { "epoch": 0.91, "learning_rate": 4.6919822219224196e-07, "loss": 1.2307, "step": 33140 }, { "epoch": 0.91, "learning_rate": 4.689305032446323e-07, "loss": 1.2839, "step": 33141 }, { "epoch": 0.91, "learning_rate": 4.686628588636288e-07, "loss": 1.1865, "step": 33142 }, { "epoch": 0.91, "learning_rate": 4.6839528905132326e-07, "loss": 1.1538, "step": 33143 }, { "epoch": 0.91, "learning_rate": 4.6812779380981166e-07, "loss": 1.3613, "step": 33144 }, { "epoch": 0.91, "learning_rate": 4.6786037314118794e-07, "loss": 1.1936, "step": 33145 }, { "epoch": 0.91, "learning_rate": 4.675930270475404e-07, "loss": 1.2986, "step": 33146 }, { "epoch": 0.91, "learning_rate": 4.673257555309629e-07, "loss": 1.4282, "step": 33147 }, { "epoch": 0.91, "learning_rate": 4.670585585935461e-07, "loss": 1.2041, "step": 33148 }, { "epoch": 0.91, "learning_rate": 4.6679143623738266e-07, "loss": 1.344, "step": 33149 }, { "epoch": 0.91, "learning_rate": 4.665243884645565e-07, "loss": 1.2485, "step": 33150 }, { "epoch": 0.91, "learning_rate": 4.662574152771626e-07, "loss": 1.3035, "step": 33151 }, { "epoch": 0.91, "learning_rate": 4.659905166772871e-07, "loss": 1.2581, "step": 33152 }, { "epoch": 0.91, "learning_rate": 4.6572369266701835e-07, "loss": 1.2263, "step": 33153 }, { "epoch": 0.91, "learning_rate": 4.654569432484457e-07, "loss": 1.3423, "step": 33154 }, { "epoch": 0.91, "learning_rate": 4.6519026842365313e-07, "loss": 1.218, "step": 33155 }, { "epoch": 0.91, "learning_rate": 4.6492366819472777e-07, "loss": 1.1487, "step": 33156 }, { "epoch": 0.91, "learning_rate": 4.6465714256375695e-07, "loss": 1.416, "step": 33157 }, { "epoch": 0.91, "learning_rate": 4.6439069153282556e-07, "loss": 1.1177, "step": 33158 }, { "epoch": 0.91, "learning_rate": 4.6412431510401537e-07, "loss": 1.1682, "step": 33159 }, { "epoch": 0.91, "learning_rate": 4.638580132794135e-07, "loss": 1.3389, "step": 33160 }, { "epoch": 0.91, "learning_rate": 4.635917860611028e-07, "loss": 1.1636, "step": 33161 }, { "epoch": 0.91, "learning_rate": 4.633256334511649e-07, "loss": 1.3174, "step": 33162 }, { "epoch": 0.91, "learning_rate": 4.630595554516826e-07, "loss": 1.207, "step": 33163 }, { "epoch": 0.91, "learning_rate": 4.627935520647386e-07, "loss": 1.1125, "step": 33164 }, { "epoch": 0.91, "learning_rate": 4.625276232924125e-07, "loss": 1.3008, "step": 33165 }, { "epoch": 0.91, "learning_rate": 4.622617691367859e-07, "loss": 1.2268, "step": 33166 }, { "epoch": 0.91, "learning_rate": 4.6199598959993707e-07, "loss": 1.2583, "step": 33167 }, { "epoch": 0.91, "learning_rate": 4.617302846839489e-07, "loss": 1.29, "step": 33168 }, { "epoch": 0.91, "learning_rate": 4.614646543908963e-07, "loss": 1.2307, "step": 33169 }, { "epoch": 0.91, "learning_rate": 4.6119909872285875e-07, "loss": 1.281, "step": 33170 }, { "epoch": 0.91, "learning_rate": 4.609336176819135e-07, "loss": 1.4048, "step": 33171 }, { "epoch": 0.91, "learning_rate": 4.6066821127013885e-07, "loss": 1.4075, "step": 33172 }, { "epoch": 0.91, "learning_rate": 4.604028794896109e-07, "loss": 1.3052, "step": 33173 }, { "epoch": 0.91, "learning_rate": 4.601376223424037e-07, "loss": 1.2354, "step": 33174 }, { "epoch": 0.91, "learning_rate": 4.598724398305954e-07, "loss": 1.1071, "step": 33175 }, { "epoch": 0.91, "learning_rate": 4.596073319562577e-07, "loss": 1.1504, "step": 33176 }, { "epoch": 0.91, "learning_rate": 4.5934229872146683e-07, "loss": 1.1887, "step": 33177 }, { "epoch": 0.91, "learning_rate": 4.590773401282944e-07, "loss": 1.3711, "step": 33178 }, { "epoch": 0.91, "learning_rate": 4.588124561788154e-07, "loss": 1.2439, "step": 33179 }, { "epoch": 0.91, "learning_rate": 4.585476468751016e-07, "loss": 1.0957, "step": 33180 }, { "epoch": 0.91, "learning_rate": 4.582829122192234e-07, "loss": 1.4087, "step": 33181 }, { "epoch": 0.91, "learning_rate": 4.580182522132526e-07, "loss": 1.2639, "step": 33182 }, { "epoch": 0.91, "learning_rate": 4.577536668592608e-07, "loss": 1.1755, "step": 33183 }, { "epoch": 0.91, "learning_rate": 4.5748915615931754e-07, "loss": 1.4043, "step": 33184 }, { "epoch": 0.91, "learning_rate": 4.572247201154911e-07, "loss": 1.3713, "step": 33185 }, { "epoch": 0.91, "learning_rate": 4.569603587298499e-07, "loss": 1.3755, "step": 33186 }, { "epoch": 0.91, "learning_rate": 4.566960720044655e-07, "loss": 1.2979, "step": 33187 }, { "epoch": 0.91, "learning_rate": 4.5643185994140193e-07, "loss": 1.1372, "step": 33188 }, { "epoch": 0.91, "learning_rate": 4.561677225427308e-07, "loss": 1.1877, "step": 33189 }, { "epoch": 0.91, "learning_rate": 4.5590365981051157e-07, "loss": 1.2017, "step": 33190 }, { "epoch": 0.91, "learning_rate": 4.5563967174681587e-07, "loss": 1.1309, "step": 33191 }, { "epoch": 0.91, "learning_rate": 4.5537575835370773e-07, "loss": 1.1936, "step": 33192 }, { "epoch": 0.91, "learning_rate": 4.5511191963325097e-07, "loss": 1.2864, "step": 33193 }, { "epoch": 0.91, "learning_rate": 4.5484815558751063e-07, "loss": 1.2314, "step": 33194 }, { "epoch": 0.91, "learning_rate": 4.5458446621854947e-07, "loss": 1.1726, "step": 33195 }, { "epoch": 0.91, "learning_rate": 4.5432085152843143e-07, "loss": 1.3201, "step": 33196 }, { "epoch": 0.91, "learning_rate": 4.540573115192182e-07, "loss": 1.1689, "step": 33197 }, { "epoch": 0.91, "learning_rate": 4.537938461929714e-07, "loss": 1.1887, "step": 33198 }, { "epoch": 0.91, "learning_rate": 4.5353045555175167e-07, "loss": 1.209, "step": 33199 }, { "epoch": 0.91, "learning_rate": 4.532671395976218e-07, "loss": 1.2793, "step": 33200 }, { "epoch": 0.91, "learning_rate": 4.5300389833264127e-07, "loss": 1.2717, "step": 33201 }, { "epoch": 0.91, "learning_rate": 4.527407317588683e-07, "loss": 1.2661, "step": 33202 }, { "epoch": 0.91, "learning_rate": 4.5247763987836146e-07, "loss": 1.2695, "step": 33203 }, { "epoch": 0.91, "learning_rate": 4.5221462269318115e-07, "loss": 1.1221, "step": 33204 }, { "epoch": 0.91, "learning_rate": 4.519516802053847e-07, "loss": 1.175, "step": 33205 }, { "epoch": 0.91, "learning_rate": 4.51688812417026e-07, "loss": 1.2905, "step": 33206 }, { "epoch": 0.91, "learning_rate": 4.5142601933016563e-07, "loss": 1.1765, "step": 33207 }, { "epoch": 0.91, "learning_rate": 4.5116330094685856e-07, "loss": 1.2349, "step": 33208 }, { "epoch": 0.91, "learning_rate": 4.509006572691588e-07, "loss": 1.3594, "step": 33209 }, { "epoch": 0.91, "learning_rate": 4.5063808829912123e-07, "loss": 1.1975, "step": 33210 }, { "epoch": 0.91, "learning_rate": 4.5037559403880215e-07, "loss": 1.3013, "step": 33211 }, { "epoch": 0.91, "learning_rate": 4.501131744902543e-07, "loss": 1.2117, "step": 33212 }, { "epoch": 0.91, "learning_rate": 4.498508296555304e-07, "loss": 1.1519, "step": 33213 }, { "epoch": 0.91, "learning_rate": 4.4958855953668003e-07, "loss": 1.3186, "step": 33214 }, { "epoch": 0.91, "learning_rate": 4.493263641357604e-07, "loss": 1.2253, "step": 33215 }, { "epoch": 0.91, "learning_rate": 4.490642434548198e-07, "loss": 1.3589, "step": 33216 }, { "epoch": 0.91, "learning_rate": 4.4880219749591e-07, "loss": 1.6753, "step": 33217 }, { "epoch": 0.91, "learning_rate": 4.485402262610783e-07, "loss": 1.1689, "step": 33218 }, { "epoch": 0.91, "learning_rate": 4.482783297523785e-07, "loss": 1.2466, "step": 33219 }, { "epoch": 0.91, "learning_rate": 4.480165079718568e-07, "loss": 1.2205, "step": 33220 }, { "epoch": 0.91, "learning_rate": 4.4775476092156155e-07, "loss": 1.1687, "step": 33221 }, { "epoch": 0.91, "learning_rate": 4.4749308860354223e-07, "loss": 1.2551, "step": 33222 }, { "epoch": 0.91, "learning_rate": 4.47231491019845e-07, "loss": 1.1875, "step": 33223 }, { "epoch": 0.91, "learning_rate": 4.4696996817251814e-07, "loss": 1.2688, "step": 33224 }, { "epoch": 0.91, "learning_rate": 4.467085200636034e-07, "loss": 1.4175, "step": 33225 }, { "epoch": 0.91, "learning_rate": 4.464471466951503e-07, "loss": 1.2529, "step": 33226 }, { "epoch": 0.91, "learning_rate": 4.461858480692005e-07, "loss": 1.2402, "step": 33227 }, { "epoch": 0.91, "learning_rate": 4.4592462418780346e-07, "loss": 1.2542, "step": 33228 }, { "epoch": 0.91, "learning_rate": 4.4566347505299646e-07, "loss": 1.4351, "step": 33229 }, { "epoch": 0.91, "learning_rate": 4.4540240066682783e-07, "loss": 1.2258, "step": 33230 }, { "epoch": 0.91, "learning_rate": 4.4514140103133596e-07, "loss": 1.2161, "step": 33231 }, { "epoch": 0.91, "learning_rate": 4.44880476148567e-07, "loss": 1.3396, "step": 33232 }, { "epoch": 0.91, "learning_rate": 4.446196260205582e-07, "loss": 1.1653, "step": 33233 }, { "epoch": 0.91, "learning_rate": 4.4435885064935346e-07, "loss": 1.2783, "step": 33234 }, { "epoch": 0.91, "learning_rate": 4.4409815003699006e-07, "loss": 1.3499, "step": 33235 }, { "epoch": 0.91, "learning_rate": 4.4383752418550975e-07, "loss": 1.3762, "step": 33236 }, { "epoch": 0.91, "learning_rate": 4.435769730969519e-07, "loss": 1.2563, "step": 33237 }, { "epoch": 0.91, "learning_rate": 4.4331649677335275e-07, "loss": 1.3865, "step": 33238 }, { "epoch": 0.91, "learning_rate": 4.4305609521675284e-07, "loss": 1.0933, "step": 33239 }, { "epoch": 0.91, "learning_rate": 4.427957684291884e-07, "loss": 1.3198, "step": 33240 }, { "epoch": 0.91, "learning_rate": 4.4253551641269545e-07, "loss": 1.1902, "step": 33241 }, { "epoch": 0.91, "learning_rate": 4.4227533916930907e-07, "loss": 1.2405, "step": 33242 }, { "epoch": 0.91, "learning_rate": 4.4201523670106663e-07, "loss": 1.3381, "step": 33243 }, { "epoch": 0.91, "learning_rate": 4.4175520901000303e-07, "loss": 1.2168, "step": 33244 }, { "epoch": 0.91, "learning_rate": 4.4149525609815224e-07, "loss": 1.2632, "step": 33245 }, { "epoch": 0.91, "learning_rate": 4.412353779675471e-07, "loss": 1.2896, "step": 33246 }, { "epoch": 0.91, "learning_rate": 4.4097557462022157e-07, "loss": 1.3425, "step": 33247 }, { "epoch": 0.91, "learning_rate": 4.407158460582084e-07, "loss": 1.3301, "step": 33248 }, { "epoch": 0.91, "learning_rate": 4.4045619228354043e-07, "loss": 1.1653, "step": 33249 }, { "epoch": 0.91, "learning_rate": 4.4019661329824605e-07, "loss": 1.3625, "step": 33250 }, { "epoch": 0.91, "learning_rate": 4.3993710910435917e-07, "loss": 1.2639, "step": 33251 }, { "epoch": 0.91, "learning_rate": 4.396776797039093e-07, "loss": 1.3818, "step": 33252 }, { "epoch": 0.91, "learning_rate": 4.3941832509892367e-07, "loss": 1.2415, "step": 33253 }, { "epoch": 0.91, "learning_rate": 4.391590452914352e-07, "loss": 1.2332, "step": 33254 }, { "epoch": 0.91, "learning_rate": 4.388998402834699e-07, "loss": 1.3464, "step": 33255 }, { "epoch": 0.91, "learning_rate": 4.3864071007705734e-07, "loss": 1.3528, "step": 33256 }, { "epoch": 0.91, "learning_rate": 4.3838165467422145e-07, "loss": 1.2156, "step": 33257 }, { "epoch": 0.91, "learning_rate": 4.3812267407699394e-07, "loss": 1.3752, "step": 33258 }, { "epoch": 0.91, "learning_rate": 4.3786376828739763e-07, "loss": 1.2275, "step": 33259 }, { "epoch": 0.91, "learning_rate": 4.3760493730745757e-07, "loss": 1.3848, "step": 33260 }, { "epoch": 0.91, "learning_rate": 4.373461811391999e-07, "loss": 1.1174, "step": 33261 }, { "epoch": 0.91, "learning_rate": 4.370874997846508e-07, "loss": 1.238, "step": 33262 }, { "epoch": 0.91, "learning_rate": 4.3682889324583086e-07, "loss": 1.3599, "step": 33263 }, { "epoch": 0.91, "learning_rate": 4.365703615247663e-07, "loss": 1.3098, "step": 33264 }, { "epoch": 0.91, "learning_rate": 4.363119046234754e-07, "loss": 1.2771, "step": 33265 }, { "epoch": 0.91, "learning_rate": 4.360535225439855e-07, "loss": 1.3181, "step": 33266 }, { "epoch": 0.91, "learning_rate": 4.357952152883149e-07, "loss": 1.3315, "step": 33267 }, { "epoch": 0.91, "learning_rate": 4.3553698285848436e-07, "loss": 1.1782, "step": 33268 }, { "epoch": 0.91, "learning_rate": 4.3527882525651545e-07, "loss": 1.1763, "step": 33269 }, { "epoch": 0.91, "learning_rate": 4.350207424844266e-07, "loss": 1.2219, "step": 33270 }, { "epoch": 0.91, "learning_rate": 4.3476273454424067e-07, "loss": 1.2046, "step": 33271 }, { "epoch": 0.91, "learning_rate": 4.345048014379694e-07, "loss": 1.3564, "step": 33272 }, { "epoch": 0.91, "learning_rate": 4.342469431676366e-07, "loss": 1.1609, "step": 33273 }, { "epoch": 0.91, "learning_rate": 4.3398915973525637e-07, "loss": 1.2112, "step": 33274 }, { "epoch": 0.91, "learning_rate": 4.337314511428492e-07, "loss": 1.4121, "step": 33275 }, { "epoch": 0.91, "learning_rate": 4.3347381739242576e-07, "loss": 1.353, "step": 33276 }, { "epoch": 0.91, "learning_rate": 4.332162584860067e-07, "loss": 1.2441, "step": 33277 }, { "epoch": 0.91, "learning_rate": 4.3295877442560365e-07, "loss": 1.0592, "step": 33278 }, { "epoch": 0.91, "learning_rate": 4.32701365213235e-07, "loss": 1.1741, "step": 33279 }, { "epoch": 0.91, "learning_rate": 4.3244403085090927e-07, "loss": 1.6333, "step": 33280 }, { "epoch": 0.91, "learning_rate": 4.3218677134064356e-07, "loss": 1.2952, "step": 33281 }, { "epoch": 0.91, "learning_rate": 4.319295866844475e-07, "loss": 1.093, "step": 33282 }, { "epoch": 0.91, "learning_rate": 4.316724768843372e-07, "loss": 1.2754, "step": 33283 }, { "epoch": 0.91, "learning_rate": 4.314154419423222e-07, "loss": 1.3718, "step": 33284 }, { "epoch": 0.91, "learning_rate": 4.31158481860412e-07, "loss": 1.3713, "step": 33285 }, { "epoch": 0.91, "learning_rate": 4.309015966406194e-07, "loss": 1.1533, "step": 33286 }, { "epoch": 0.91, "learning_rate": 4.306447862849528e-07, "loss": 1.3132, "step": 33287 }, { "epoch": 0.91, "learning_rate": 4.303880507954228e-07, "loss": 1.3135, "step": 33288 }, { "epoch": 0.91, "learning_rate": 4.3013139017403336e-07, "loss": 1.3213, "step": 33289 }, { "epoch": 0.91, "learning_rate": 4.298748044227985e-07, "loss": 1.1763, "step": 33290 }, { "epoch": 0.91, "learning_rate": 4.296182935437232e-07, "loss": 1.301, "step": 33291 }, { "epoch": 0.91, "learning_rate": 4.2936185753881363e-07, "loss": 1.3477, "step": 33292 }, { "epoch": 0.91, "learning_rate": 4.2910549641007494e-07, "loss": 1.6636, "step": 33293 }, { "epoch": 0.91, "learning_rate": 4.2884921015951544e-07, "loss": 1.2578, "step": 33294 }, { "epoch": 0.91, "learning_rate": 4.285929987891402e-07, "loss": 1.3044, "step": 33295 }, { "epoch": 0.91, "learning_rate": 4.2833686230095095e-07, "loss": 1.3352, "step": 33296 }, { "epoch": 0.91, "learning_rate": 4.280808006969528e-07, "loss": 1.3274, "step": 33297 }, { "epoch": 0.91, "learning_rate": 4.278248139791508e-07, "loss": 1.2939, "step": 33298 }, { "epoch": 0.91, "learning_rate": 4.275689021495455e-07, "loss": 1.189, "step": 33299 }, { "epoch": 0.91, "learning_rate": 4.273130652101398e-07, "loss": 1.114, "step": 33300 }, { "epoch": 0.91, "learning_rate": 4.270573031629355e-07, "loss": 1.2024, "step": 33301 }, { "epoch": 0.91, "learning_rate": 4.268016160099342e-07, "loss": 1.1853, "step": 33302 }, { "epoch": 0.91, "learning_rate": 4.265460037531344e-07, "loss": 1.1287, "step": 33303 }, { "epoch": 0.91, "learning_rate": 4.2629046639453665e-07, "loss": 1.2617, "step": 33304 }, { "epoch": 0.91, "learning_rate": 4.260350039361416e-07, "loss": 1.0032, "step": 33305 }, { "epoch": 0.91, "learning_rate": 4.2577961637994544e-07, "loss": 1.2471, "step": 33306 }, { "epoch": 0.91, "learning_rate": 4.2552430372794886e-07, "loss": 1.2488, "step": 33307 }, { "epoch": 0.91, "learning_rate": 4.2526906598214565e-07, "loss": 1.2903, "step": 33308 }, { "epoch": 0.91, "learning_rate": 4.2501390314453663e-07, "loss": 1.2185, "step": 33309 }, { "epoch": 0.91, "learning_rate": 4.247588152171167e-07, "loss": 1.2832, "step": 33310 }, { "epoch": 0.91, "learning_rate": 4.2450380220188104e-07, "loss": 1.2979, "step": 33311 }, { "epoch": 0.91, "learning_rate": 4.2424886410082356e-07, "loss": 1.1721, "step": 33312 }, { "epoch": 0.91, "learning_rate": 4.2399400091594154e-07, "loss": 1.0645, "step": 33313 }, { "epoch": 0.91, "learning_rate": 4.237392126492268e-07, "loss": 1.3835, "step": 33314 }, { "epoch": 0.91, "learning_rate": 4.2348449930267213e-07, "loss": 1.2815, "step": 33315 }, { "epoch": 0.91, "learning_rate": 4.2322986087827367e-07, "loss": 1.1624, "step": 33316 }, { "epoch": 0.91, "learning_rate": 4.229752973780199e-07, "loss": 1.2688, "step": 33317 }, { "epoch": 0.91, "learning_rate": 4.227208088039059e-07, "loss": 1.2083, "step": 33318 }, { "epoch": 0.91, "learning_rate": 4.2246639515791886e-07, "loss": 1.2637, "step": 33319 }, { "epoch": 0.91, "learning_rate": 4.2221205644205285e-07, "loss": 1.3606, "step": 33320 }, { "epoch": 0.91, "learning_rate": 4.219577926582941e-07, "loss": 1.2847, "step": 33321 }, { "epoch": 0.91, "learning_rate": 4.2170360380863527e-07, "loss": 1.1404, "step": 33322 }, { "epoch": 0.91, "learning_rate": 4.214494898950616e-07, "loss": 1.2861, "step": 33323 }, { "epoch": 0.91, "learning_rate": 4.211954509195648e-07, "loss": 1.1697, "step": 33324 }, { "epoch": 0.91, "learning_rate": 4.2094148688412886e-07, "loss": 1.1287, "step": 33325 }, { "epoch": 0.91, "learning_rate": 4.206875977907443e-07, "loss": 1.1548, "step": 33326 }, { "epoch": 0.91, "learning_rate": 4.2043378364139407e-07, "loss": 1.4109, "step": 33327 }, { "epoch": 0.91, "learning_rate": 4.201800444380655e-07, "loss": 1.2671, "step": 33328 }, { "epoch": 0.91, "learning_rate": 4.1992638018274246e-07, "loss": 1.2397, "step": 33329 }, { "epoch": 0.91, "learning_rate": 4.196727908774123e-07, "loss": 1.333, "step": 33330 }, { "epoch": 0.91, "learning_rate": 4.194192765240568e-07, "loss": 1.2483, "step": 33331 }, { "epoch": 0.91, "learning_rate": 4.1916583712465874e-07, "loss": 1.2722, "step": 33332 }, { "epoch": 0.91, "learning_rate": 4.189124726812033e-07, "loss": 1.4272, "step": 33333 }, { "epoch": 0.91, "learning_rate": 4.18659183195671e-07, "loss": 1.1655, "step": 33334 }, { "epoch": 0.91, "learning_rate": 4.184059686700437e-07, "loss": 1.2291, "step": 33335 }, { "epoch": 0.91, "learning_rate": 4.1815282910630196e-07, "loss": 1.1274, "step": 33336 }, { "epoch": 0.91, "learning_rate": 4.1789976450642755e-07, "loss": 1.3274, "step": 33337 }, { "epoch": 0.91, "learning_rate": 4.1764677487240003e-07, "loss": 1.2471, "step": 33338 }, { "epoch": 0.91, "learning_rate": 4.1739386020619776e-07, "loss": 1.3518, "step": 33339 }, { "epoch": 0.91, "learning_rate": 4.171410205097981e-07, "loss": 1.28, "step": 33340 }, { "epoch": 0.91, "learning_rate": 4.1688825578518275e-07, "loss": 1.0231, "step": 33341 }, { "epoch": 0.91, "learning_rate": 4.16635566034328e-07, "loss": 1.2086, "step": 33342 }, { "epoch": 0.91, "learning_rate": 4.163829512592088e-07, "loss": 1.397, "step": 33343 }, { "epoch": 0.91, "learning_rate": 4.1613041146180254e-07, "loss": 1.3376, "step": 33344 }, { "epoch": 0.91, "learning_rate": 4.1587794664408656e-07, "loss": 1.2463, "step": 33345 }, { "epoch": 0.91, "learning_rate": 4.1562555680803475e-07, "loss": 1.2341, "step": 33346 }, { "epoch": 0.91, "learning_rate": 4.1537324195562003e-07, "loss": 1.3457, "step": 33347 }, { "epoch": 0.91, "learning_rate": 4.1512100208881967e-07, "loss": 1.2415, "step": 33348 }, { "epoch": 0.91, "learning_rate": 4.1486883720960436e-07, "loss": 1.4011, "step": 33349 }, { "epoch": 0.91, "learning_rate": 4.1461674731994917e-07, "loss": 1.1602, "step": 33350 }, { "epoch": 0.91, "learning_rate": 4.143647324218236e-07, "loss": 1.7222, "step": 33351 }, { "epoch": 0.91, "learning_rate": 4.1411279251720283e-07, "loss": 1.3298, "step": 33352 }, { "epoch": 0.91, "learning_rate": 4.138609276080552e-07, "loss": 1.137, "step": 33353 }, { "epoch": 0.91, "learning_rate": 4.1360913769635246e-07, "loss": 1.1995, "step": 33354 }, { "epoch": 0.91, "learning_rate": 4.13357422784062e-07, "loss": 1.3667, "step": 33355 }, { "epoch": 0.91, "learning_rate": 4.1310578287315663e-07, "loss": 1.3069, "step": 33356 }, { "epoch": 0.91, "learning_rate": 4.1285421796560363e-07, "loss": 1.2659, "step": 33357 }, { "epoch": 0.91, "learning_rate": 4.1260272806337154e-07, "loss": 1.3896, "step": 33358 }, { "epoch": 0.91, "learning_rate": 4.1235131316842536e-07, "loss": 1.105, "step": 33359 }, { "epoch": 0.91, "learning_rate": 4.1209997328273467e-07, "loss": 1.3843, "step": 33360 }, { "epoch": 0.91, "learning_rate": 4.1184870840826787e-07, "loss": 1.1616, "step": 33361 }, { "epoch": 0.91, "learning_rate": 4.115975185469845e-07, "loss": 1.1758, "step": 33362 }, { "epoch": 0.91, "learning_rate": 4.113464037008552e-07, "loss": 1.2371, "step": 33363 }, { "epoch": 0.91, "learning_rate": 4.110953638718418e-07, "loss": 1.2375, "step": 33364 }, { "epoch": 0.91, "learning_rate": 4.1084439906191156e-07, "loss": 1.2815, "step": 33365 }, { "epoch": 0.91, "learning_rate": 4.105935092730229e-07, "loss": 1.2021, "step": 33366 }, { "epoch": 0.91, "learning_rate": 4.103426945071431e-07, "loss": 1.2888, "step": 33367 }, { "epoch": 0.91, "learning_rate": 4.1009195476623075e-07, "loss": 1.2334, "step": 33368 }, { "epoch": 0.91, "learning_rate": 4.0984129005225303e-07, "loss": 1.2415, "step": 33369 }, { "epoch": 0.91, "learning_rate": 4.0959070036716396e-07, "loss": 1.2219, "step": 33370 }, { "epoch": 0.91, "learning_rate": 4.0934018571292976e-07, "loss": 1.4146, "step": 33371 }, { "epoch": 0.91, "learning_rate": 4.0908974609150555e-07, "loss": 1.2024, "step": 33372 }, { "epoch": 0.91, "learning_rate": 4.0883938150485634e-07, "loss": 1.2563, "step": 33373 }, { "epoch": 0.91, "learning_rate": 4.085890919549351e-07, "loss": 1.3108, "step": 33374 }, { "epoch": 0.91, "learning_rate": 4.0833887744370473e-07, "loss": 1.4062, "step": 33375 }, { "epoch": 0.91, "learning_rate": 4.08088737973118e-07, "loss": 1.2698, "step": 33376 }, { "epoch": 0.91, "learning_rate": 4.0783867354513673e-07, "loss": 1.198, "step": 33377 }, { "epoch": 0.91, "learning_rate": 4.0758868416171495e-07, "loss": 1.1445, "step": 33378 }, { "epoch": 0.91, "learning_rate": 4.073387698248077e-07, "loss": 1.1611, "step": 33379 }, { "epoch": 0.91, "learning_rate": 4.0708893053637124e-07, "loss": 1.324, "step": 33380 }, { "epoch": 0.91, "learning_rate": 4.0683916629836063e-07, "loss": 1.0725, "step": 33381 }, { "epoch": 0.91, "learning_rate": 4.0658947711272987e-07, "loss": 1.4282, "step": 33382 }, { "epoch": 0.91, "learning_rate": 4.063398629814308e-07, "loss": 1.2468, "step": 33383 }, { "epoch": 0.91, "learning_rate": 4.0609032390641733e-07, "loss": 1.147, "step": 33384 }, { "epoch": 0.91, "learning_rate": 4.058408598896435e-07, "loss": 1.2588, "step": 33385 }, { "epoch": 0.91, "learning_rate": 4.055914709330577e-07, "loss": 1.272, "step": 33386 }, { "epoch": 0.91, "learning_rate": 4.053421570386129e-07, "loss": 1.1802, "step": 33387 }, { "epoch": 0.91, "learning_rate": 4.050929182082597e-07, "loss": 1.3176, "step": 33388 }, { "epoch": 0.91, "learning_rate": 4.048437544439476e-07, "loss": 1.3516, "step": 33389 }, { "epoch": 0.91, "learning_rate": 4.045946657476263e-07, "loss": 1.009, "step": 33390 }, { "epoch": 0.91, "learning_rate": 4.0434565212124297e-07, "loss": 1.3589, "step": 33391 }, { "epoch": 0.91, "learning_rate": 4.0409671356674727e-07, "loss": 1.2942, "step": 33392 }, { "epoch": 0.91, "learning_rate": 4.038478500860876e-07, "loss": 1.1873, "step": 33393 }, { "epoch": 0.91, "learning_rate": 4.035990616812091e-07, "loss": 1.4458, "step": 33394 }, { "epoch": 0.91, "learning_rate": 4.0335034835406016e-07, "loss": 1.2996, "step": 33395 }, { "epoch": 0.91, "learning_rate": 4.031017101065848e-07, "loss": 1.1348, "step": 33396 }, { "epoch": 0.91, "learning_rate": 4.028531469407293e-07, "loss": 1.3357, "step": 33397 }, { "epoch": 0.91, "learning_rate": 4.0260465885843647e-07, "loss": 1.0464, "step": 33398 }, { "epoch": 0.91, "learning_rate": 4.0235624586165257e-07, "loss": 1.1719, "step": 33399 }, { "epoch": 0.91, "learning_rate": 4.021079079523205e-07, "loss": 1.3115, "step": 33400 }, { "epoch": 0.91, "learning_rate": 4.0185964513238305e-07, "loss": 1.3545, "step": 33401 }, { "epoch": 0.91, "learning_rate": 4.0161145740378103e-07, "loss": 1.0198, "step": 33402 }, { "epoch": 0.91, "learning_rate": 4.013633447684595e-07, "loss": 1.1489, "step": 33403 }, { "epoch": 0.91, "learning_rate": 4.011153072283569e-07, "loss": 1.3835, "step": 33404 }, { "epoch": 0.91, "learning_rate": 4.008673447854139e-07, "loss": 1.2495, "step": 33405 }, { "epoch": 0.91, "learning_rate": 4.0061945744157007e-07, "loss": 1.2949, "step": 33406 }, { "epoch": 0.91, "learning_rate": 4.0037164519876604e-07, "loss": 1.6885, "step": 33407 }, { "epoch": 0.91, "learning_rate": 4.0012390805894254e-07, "loss": 1.3811, "step": 33408 }, { "epoch": 0.91, "learning_rate": 3.9987624602403355e-07, "loss": 1.1677, "step": 33409 }, { "epoch": 0.91, "learning_rate": 3.9962865909597857e-07, "loss": 1.1736, "step": 33410 }, { "epoch": 0.91, "learning_rate": 3.9938114727671396e-07, "loss": 1.2371, "step": 33411 }, { "epoch": 0.91, "learning_rate": 3.991337105681792e-07, "loss": 1.1455, "step": 33412 }, { "epoch": 0.91, "learning_rate": 3.988863489723049e-07, "loss": 1.1741, "step": 33413 }, { "epoch": 0.91, "learning_rate": 3.986390624910308e-07, "loss": 1.2134, "step": 33414 }, { "epoch": 0.91, "learning_rate": 3.983918511262874e-07, "loss": 1.6904, "step": 33415 }, { "epoch": 0.91, "learning_rate": 3.981447148800133e-07, "loss": 1.2083, "step": 33416 }, { "epoch": 0.91, "learning_rate": 3.9789765375414016e-07, "loss": 1.2336, "step": 33417 }, { "epoch": 0.91, "learning_rate": 3.976506677505998e-07, "loss": 1.2261, "step": 33418 }, { "epoch": 0.91, "learning_rate": 3.9740375687132513e-07, "loss": 1.3115, "step": 33419 }, { "epoch": 0.91, "learning_rate": 3.97156921118248e-07, "loss": 1.2976, "step": 33420 }, { "epoch": 0.91, "learning_rate": 3.969101604933001e-07, "loss": 1.3281, "step": 33421 }, { "epoch": 0.91, "learning_rate": 3.9666347499840997e-07, "loss": 1.2715, "step": 33422 }, { "epoch": 0.91, "learning_rate": 3.9641686463551046e-07, "loss": 1.1653, "step": 33423 }, { "epoch": 0.91, "learning_rate": 3.9617032940652887e-07, "loss": 1.3074, "step": 33424 }, { "epoch": 0.91, "learning_rate": 3.95923869313396e-07, "loss": 1.302, "step": 33425 }, { "epoch": 0.91, "learning_rate": 3.956774843580358e-07, "loss": 1.3528, "step": 33426 }, { "epoch": 0.91, "learning_rate": 3.954311745423811e-07, "loss": 1.2483, "step": 33427 }, { "epoch": 0.91, "learning_rate": 3.9518493986835604e-07, "loss": 1.3997, "step": 33428 }, { "epoch": 0.91, "learning_rate": 3.9493878033788677e-07, "loss": 1.4167, "step": 33429 }, { "epoch": 0.91, "learning_rate": 3.946926959528996e-07, "loss": 1.254, "step": 33430 }, { "epoch": 0.91, "learning_rate": 3.9444668671532185e-07, "loss": 1.3508, "step": 33431 }, { "epoch": 0.91, "learning_rate": 3.9420075262707527e-07, "loss": 1.1768, "step": 33432 }, { "epoch": 0.91, "learning_rate": 3.93954893690085e-07, "loss": 1.2271, "step": 33433 }, { "epoch": 0.91, "learning_rate": 3.93709109906274e-07, "loss": 1.7378, "step": 33434 }, { "epoch": 0.91, "learning_rate": 3.934634012775662e-07, "loss": 1.1948, "step": 33435 }, { "epoch": 0.91, "learning_rate": 3.932177678058835e-07, "loss": 1.1758, "step": 33436 }, { "epoch": 0.91, "learning_rate": 3.9297220949314875e-07, "loss": 1.1985, "step": 33437 }, { "epoch": 0.91, "learning_rate": 3.927267263412793e-07, "loss": 1.2654, "step": 33438 }, { "epoch": 0.91, "learning_rate": 3.9248131835220026e-07, "loss": 1.2837, "step": 33439 }, { "epoch": 0.91, "learning_rate": 3.92235985527829e-07, "loss": 1.3203, "step": 33440 }, { "epoch": 0.91, "learning_rate": 3.919907278700852e-07, "loss": 1.2139, "step": 33441 }, { "epoch": 0.91, "learning_rate": 3.9174554538088825e-07, "loss": 1.1674, "step": 33442 }, { "epoch": 0.91, "learning_rate": 3.9150043806215674e-07, "loss": 1.1936, "step": 33443 }, { "epoch": 0.91, "learning_rate": 3.912554059158069e-07, "loss": 1.1885, "step": 33444 }, { "epoch": 0.91, "learning_rate": 3.9101044894375605e-07, "loss": 1.2864, "step": 33445 }, { "epoch": 0.91, "learning_rate": 3.9076556714792156e-07, "loss": 1.2162, "step": 33446 }, { "epoch": 0.91, "learning_rate": 3.9052076053021857e-07, "loss": 1.2255, "step": 33447 }, { "epoch": 0.91, "learning_rate": 3.9027602909256224e-07, "loss": 1.3083, "step": 33448 }, { "epoch": 0.91, "learning_rate": 3.9003137283686766e-07, "loss": 1.2744, "step": 33449 }, { "epoch": 0.91, "learning_rate": 3.8978679176504884e-07, "loss": 1.2925, "step": 33450 }, { "epoch": 0.91, "learning_rate": 3.8954228587901766e-07, "loss": 1.6143, "step": 33451 }, { "epoch": 0.91, "learning_rate": 3.892978551806914e-07, "loss": 1.2605, "step": 33452 }, { "epoch": 0.91, "learning_rate": 3.890534996719764e-07, "loss": 1.2466, "step": 33453 }, { "epoch": 0.91, "learning_rate": 3.888092193547888e-07, "loss": 1.1223, "step": 33454 }, { "epoch": 0.91, "learning_rate": 3.885650142310382e-07, "loss": 1.0957, "step": 33455 }, { "epoch": 0.91, "learning_rate": 3.8832088430263535e-07, "loss": 1.3047, "step": 33456 }, { "epoch": 0.91, "learning_rate": 3.8807682957149096e-07, "loss": 1.2446, "step": 33457 }, { "epoch": 0.91, "learning_rate": 3.878328500395123e-07, "loss": 1.2976, "step": 33458 }, { "epoch": 0.91, "learning_rate": 3.8758894570861016e-07, "loss": 1.2659, "step": 33459 }, { "epoch": 0.91, "learning_rate": 3.8734511658069297e-07, "loss": 1.2947, "step": 33460 }, { "epoch": 0.91, "learning_rate": 3.8710136265766585e-07, "loss": 1.2673, "step": 33461 }, { "epoch": 0.91, "learning_rate": 3.868576839414373e-07, "loss": 1.2302, "step": 33462 }, { "epoch": 0.91, "learning_rate": 3.8661408043391467e-07, "loss": 1.2627, "step": 33463 }, { "epoch": 0.91, "learning_rate": 3.8637055213700316e-07, "loss": 1.5806, "step": 33464 }, { "epoch": 0.91, "learning_rate": 3.8612709905260783e-07, "loss": 1.3984, "step": 33465 }, { "epoch": 0.91, "learning_rate": 3.8588372118263164e-07, "loss": 1.2117, "step": 33466 }, { "epoch": 0.91, "learning_rate": 3.856404185289819e-07, "loss": 1.3049, "step": 33467 }, { "epoch": 0.91, "learning_rate": 3.8539719109356053e-07, "loss": 1.2725, "step": 33468 }, { "epoch": 0.91, "learning_rate": 3.851540388782693e-07, "loss": 1.2373, "step": 33469 }, { "epoch": 0.91, "learning_rate": 3.8491096188501334e-07, "loss": 1.1533, "step": 33470 }, { "epoch": 0.91, "learning_rate": 3.846679601156922e-07, "loss": 1.1084, "step": 33471 }, { "epoch": 0.91, "learning_rate": 3.8442503357220664e-07, "loss": 1.2021, "step": 33472 }, { "epoch": 0.91, "learning_rate": 3.841821822564584e-07, "loss": 1.2546, "step": 33473 }, { "epoch": 0.91, "learning_rate": 3.839394061703472e-07, "loss": 1.344, "step": 33474 }, { "epoch": 0.91, "learning_rate": 3.8369670531577255e-07, "loss": 1.3525, "step": 33475 }, { "epoch": 0.91, "learning_rate": 3.834540796946329e-07, "loss": 1.3069, "step": 33476 }, { "epoch": 0.91, "learning_rate": 3.8321152930882566e-07, "loss": 1.1327, "step": 33477 }, { "epoch": 0.91, "learning_rate": 3.8296905416025043e-07, "loss": 1.1797, "step": 33478 }, { "epoch": 0.91, "learning_rate": 3.8272665425080235e-07, "loss": 1.2454, "step": 33479 }, { "epoch": 0.91, "learning_rate": 3.824843295823799e-07, "loss": 1.426, "step": 33480 }, { "epoch": 0.91, "learning_rate": 3.8224208015687494e-07, "loss": 1.2761, "step": 33481 }, { "epoch": 0.91, "learning_rate": 3.81999905976187e-07, "loss": 1.3071, "step": 33482 }, { "epoch": 0.91, "learning_rate": 3.817578070422101e-07, "loss": 1.4385, "step": 33483 }, { "epoch": 0.91, "learning_rate": 3.81515783356835e-07, "loss": 1.2197, "step": 33484 }, { "epoch": 0.91, "learning_rate": 3.812738349219591e-07, "loss": 1.3601, "step": 33485 }, { "epoch": 0.91, "learning_rate": 3.81031961739472e-07, "loss": 1.1697, "step": 33486 }, { "epoch": 0.91, "learning_rate": 3.8079016381127097e-07, "loss": 1.1622, "step": 33487 }, { "epoch": 0.91, "learning_rate": 3.8054844113924127e-07, "loss": 1.2563, "step": 33488 }, { "epoch": 0.91, "learning_rate": 3.803067937252791e-07, "loss": 1.2129, "step": 33489 }, { "epoch": 0.91, "learning_rate": 3.800652215712708e-07, "loss": 1.1609, "step": 33490 }, { "epoch": 0.91, "learning_rate": 3.7982372467911145e-07, "loss": 1.2598, "step": 33491 }, { "epoch": 0.91, "learning_rate": 3.7958230305068513e-07, "loss": 1.2383, "step": 33492 }, { "epoch": 0.91, "learning_rate": 3.7934095668788476e-07, "loss": 1.2856, "step": 33493 }, { "epoch": 0.91, "learning_rate": 3.7909968559259544e-07, "loss": 1.3657, "step": 33494 }, { "epoch": 0.91, "learning_rate": 3.7885848976670804e-07, "loss": 1.189, "step": 33495 }, { "epoch": 0.91, "learning_rate": 3.7861736921210533e-07, "loss": 1.0927, "step": 33496 }, { "epoch": 0.91, "learning_rate": 3.783763239306781e-07, "loss": 1.1458, "step": 33497 }, { "epoch": 0.91, "learning_rate": 3.7813535392430824e-07, "loss": 1.0042, "step": 33498 }, { "epoch": 0.91, "learning_rate": 3.778944591948852e-07, "loss": 1.2622, "step": 33499 }, { "epoch": 0.91, "learning_rate": 3.776536397442887e-07, "loss": 1.3296, "step": 33500 }, { "epoch": 0.91, "learning_rate": 3.774128955744061e-07, "loss": 1.3218, "step": 33501 }, { "epoch": 0.91, "learning_rate": 3.771722266871203e-07, "loss": 1.3486, "step": 33502 }, { "epoch": 0.91, "learning_rate": 3.7693163308431426e-07, "loss": 1.3049, "step": 33503 }, { "epoch": 0.91, "learning_rate": 3.7669111476787093e-07, "loss": 1.2756, "step": 33504 }, { "epoch": 0.91, "learning_rate": 3.764506717396688e-07, "loss": 1.2178, "step": 33505 }, { "epoch": 0.92, "learning_rate": 3.76210304001593e-07, "loss": 1.2302, "step": 33506 }, { "epoch": 0.92, "learning_rate": 3.7597001155552315e-07, "loss": 1.3662, "step": 33507 }, { "epoch": 0.92, "learning_rate": 3.757297944033367e-07, "loss": 1.1711, "step": 33508 }, { "epoch": 0.92, "learning_rate": 3.754896525469154e-07, "loss": 1.2419, "step": 33509 }, { "epoch": 0.92, "learning_rate": 3.752495859881367e-07, "loss": 1.2898, "step": 33510 }, { "epoch": 0.92, "learning_rate": 3.750095947288801e-07, "loss": 1.2144, "step": 33511 }, { "epoch": 0.92, "learning_rate": 3.747696787710231e-07, "loss": 1.2273, "step": 33512 }, { "epoch": 0.92, "learning_rate": 3.745298381164397e-07, "loss": 1.3853, "step": 33513 }, { "epoch": 0.92, "learning_rate": 3.7429007276701067e-07, "loss": 0.9113, "step": 33514 }, { "epoch": 0.92, "learning_rate": 3.7405038272461e-07, "loss": 1.1843, "step": 33515 }, { "epoch": 0.92, "learning_rate": 3.738107679911107e-07, "loss": 1.2458, "step": 33516 }, { "epoch": 0.92, "learning_rate": 3.735712285683912e-07, "loss": 1.0286, "step": 33517 }, { "epoch": 0.92, "learning_rate": 3.733317644583234e-07, "loss": 1.0837, "step": 33518 }, { "epoch": 0.92, "learning_rate": 3.730923756627802e-07, "loss": 1.3389, "step": 33519 }, { "epoch": 0.92, "learning_rate": 3.728530621836357e-07, "loss": 1.1687, "step": 33520 }, { "epoch": 0.92, "learning_rate": 3.726138240227628e-07, "loss": 1.2947, "step": 33521 }, { "epoch": 0.92, "learning_rate": 3.7237466118203115e-07, "loss": 1.2419, "step": 33522 }, { "epoch": 0.92, "learning_rate": 3.7213557366331365e-07, "loss": 1.1963, "step": 33523 }, { "epoch": 0.92, "learning_rate": 3.7189656146847884e-07, "loss": 1.3542, "step": 33524 }, { "epoch": 0.92, "learning_rate": 3.716576245993997e-07, "loss": 1.2661, "step": 33525 }, { "epoch": 0.92, "learning_rate": 3.7141876305794244e-07, "loss": 1.0327, "step": 33526 }, { "epoch": 0.92, "learning_rate": 3.7117997684597785e-07, "loss": 1.259, "step": 33527 }, { "epoch": 0.92, "learning_rate": 3.709412659653722e-07, "loss": 1.3306, "step": 33528 }, { "epoch": 0.92, "learning_rate": 3.7070263041799505e-07, "loss": 1.3228, "step": 33529 }, { "epoch": 0.92, "learning_rate": 3.7046407020571274e-07, "loss": 1.4324, "step": 33530 }, { "epoch": 0.92, "learning_rate": 3.702255853303904e-07, "loss": 1.2214, "step": 33531 }, { "epoch": 0.92, "learning_rate": 3.699871757938955e-07, "loss": 1.3633, "step": 33532 }, { "epoch": 0.92, "learning_rate": 3.697488415980921e-07, "loss": 1.1865, "step": 33533 }, { "epoch": 0.92, "learning_rate": 3.695105827448475e-07, "loss": 1.3052, "step": 33534 }, { "epoch": 0.92, "learning_rate": 3.6927239923602143e-07, "loss": 1.1909, "step": 33535 }, { "epoch": 0.92, "learning_rate": 3.690342910734801e-07, "loss": 1.2808, "step": 33536 }, { "epoch": 0.92, "learning_rate": 3.687962582590843e-07, "loss": 1.4009, "step": 33537 }, { "epoch": 0.92, "learning_rate": 3.685583007947002e-07, "loss": 1.2717, "step": 33538 }, { "epoch": 0.92, "learning_rate": 3.683204186821843e-07, "loss": 1.3604, "step": 33539 }, { "epoch": 0.92, "learning_rate": 3.6808261192340154e-07, "loss": 1.498, "step": 33540 }, { "epoch": 0.92, "learning_rate": 3.678448805202106e-07, "loss": 1.2075, "step": 33541 }, { "epoch": 0.92, "learning_rate": 3.676072244744744e-07, "loss": 1.0715, "step": 33542 }, { "epoch": 0.92, "learning_rate": 3.6736964378804696e-07, "loss": 1.0634, "step": 33543 }, { "epoch": 0.92, "learning_rate": 3.671321384627913e-07, "loss": 1.252, "step": 33544 }, { "epoch": 0.92, "learning_rate": 3.6689470850056254e-07, "loss": 1.8589, "step": 33545 }, { "epoch": 0.92, "learning_rate": 3.6665735390322253e-07, "loss": 1.1339, "step": 33546 }, { "epoch": 0.92, "learning_rate": 3.6642007467262317e-07, "loss": 1.1826, "step": 33547 }, { "epoch": 0.92, "learning_rate": 3.6618287081062186e-07, "loss": 1.2136, "step": 33548 }, { "epoch": 0.92, "learning_rate": 3.659457423190782e-07, "loss": 1.2393, "step": 33549 }, { "epoch": 0.92, "learning_rate": 3.6570868919984405e-07, "loss": 1.2239, "step": 33550 }, { "epoch": 0.92, "learning_rate": 3.6547171145477566e-07, "loss": 1.2419, "step": 33551 }, { "epoch": 0.92, "learning_rate": 3.6523480908572383e-07, "loss": 1.4033, "step": 33552 }, { "epoch": 0.92, "learning_rate": 3.6499798209454596e-07, "loss": 1.2256, "step": 33553 }, { "epoch": 0.92, "learning_rate": 3.6476123048309387e-07, "loss": 1.1626, "step": 33554 }, { "epoch": 0.92, "learning_rate": 3.645245542532183e-07, "loss": 1.2156, "step": 33555 }, { "epoch": 0.92, "learning_rate": 3.6428795340677114e-07, "loss": 1.2473, "step": 33556 }, { "epoch": 0.92, "learning_rate": 3.640514279456042e-07, "loss": 1.2466, "step": 33557 }, { "epoch": 0.92, "learning_rate": 3.638149778715683e-07, "loss": 1.2693, "step": 33558 }, { "epoch": 0.92, "learning_rate": 3.6357860318651294e-07, "loss": 1.1919, "step": 33559 }, { "epoch": 0.92, "learning_rate": 3.6334230389228564e-07, "loss": 1.4272, "step": 33560 }, { "epoch": 0.92, "learning_rate": 3.631060799907382e-07, "loss": 1.1093, "step": 33561 }, { "epoch": 0.92, "learning_rate": 3.6286993148371694e-07, "loss": 1.2273, "step": 33562 }, { "epoch": 0.92, "learning_rate": 3.626338583730682e-07, "loss": 1.2834, "step": 33563 }, { "epoch": 0.92, "learning_rate": 3.6239786066064264e-07, "loss": 1.1108, "step": 33564 }, { "epoch": 0.92, "learning_rate": 3.6216193834828327e-07, "loss": 1.197, "step": 33565 }, { "epoch": 0.92, "learning_rate": 3.6192609143783754e-07, "loss": 1.4102, "step": 33566 }, { "epoch": 0.92, "learning_rate": 3.6169031993114835e-07, "loss": 1.1675, "step": 33567 }, { "epoch": 0.92, "learning_rate": 3.6145462383006316e-07, "loss": 1.1514, "step": 33568 }, { "epoch": 0.92, "learning_rate": 3.612190031364238e-07, "loss": 1.3167, "step": 33569 }, { "epoch": 0.92, "learning_rate": 3.6098345785207543e-07, "loss": 1.46, "step": 33570 }, { "epoch": 0.92, "learning_rate": 3.607479879788589e-07, "loss": 1.0527, "step": 33571 }, { "epoch": 0.92, "learning_rate": 3.6051259351861824e-07, "loss": 1.2295, "step": 33572 }, { "epoch": 0.92, "learning_rate": 3.6027727447319417e-07, "loss": 1.2607, "step": 33573 }, { "epoch": 0.92, "learning_rate": 3.6004203084442747e-07, "loss": 1.2139, "step": 33574 }, { "epoch": 0.92, "learning_rate": 3.598068626341578e-07, "loss": 1.2383, "step": 33575 }, { "epoch": 0.92, "learning_rate": 3.5957176984422805e-07, "loss": 1.2944, "step": 33576 }, { "epoch": 0.92, "learning_rate": 3.5933675247647457e-07, "loss": 1.1594, "step": 33577 }, { "epoch": 0.92, "learning_rate": 3.5910181053273595e-07, "loss": 1.3142, "step": 33578 }, { "epoch": 0.92, "learning_rate": 3.588669440148529e-07, "loss": 1.2292, "step": 33579 }, { "epoch": 0.92, "learning_rate": 3.586321529246606e-07, "loss": 1.1973, "step": 33580 }, { "epoch": 0.92, "learning_rate": 3.583974372639987e-07, "loss": 1.3164, "step": 33581 }, { "epoch": 0.92, "learning_rate": 3.581627970346979e-07, "loss": 1.1692, "step": 33582 }, { "epoch": 0.92, "learning_rate": 3.579282322386002e-07, "loss": 1.3, "step": 33583 }, { "epoch": 0.92, "learning_rate": 3.5769374287753624e-07, "loss": 1.2686, "step": 33584 }, { "epoch": 0.92, "learning_rate": 3.5745932895334455e-07, "loss": 1.1848, "step": 33585 }, { "epoch": 0.92, "learning_rate": 3.5722499046785374e-07, "loss": 1.2864, "step": 33586 }, { "epoch": 0.92, "learning_rate": 3.569907274229023e-07, "loss": 1.1692, "step": 33587 }, { "epoch": 0.92, "learning_rate": 3.567565398203199e-07, "loss": 1.2234, "step": 33588 }, { "epoch": 0.92, "learning_rate": 3.5652242766194167e-07, "loss": 1.1174, "step": 33589 }, { "epoch": 0.92, "learning_rate": 3.562883909495951e-07, "loss": 1.3423, "step": 33590 }, { "epoch": 0.92, "learning_rate": 3.560544296851143e-07, "loss": 1.2878, "step": 33591 }, { "epoch": 0.92, "learning_rate": 3.558205438703277e-07, "loss": 1.2195, "step": 33592 }, { "epoch": 0.92, "learning_rate": 3.555867335070684e-07, "loss": 1.3328, "step": 33593 }, { "epoch": 0.92, "learning_rate": 3.5535299859716155e-07, "loss": 1.1685, "step": 33594 }, { "epoch": 0.92, "learning_rate": 3.551193391424379e-07, "loss": 1.2476, "step": 33595 }, { "epoch": 0.92, "learning_rate": 3.54885755144726e-07, "loss": 1.2087, "step": 33596 }, { "epoch": 0.92, "learning_rate": 3.546522466058522e-07, "loss": 1.1199, "step": 33597 }, { "epoch": 0.92, "learning_rate": 3.544188135276438e-07, "loss": 1.1235, "step": 33598 }, { "epoch": 0.92, "learning_rate": 3.541854559119251e-07, "loss": 1.209, "step": 33599 }, { "epoch": 0.92, "learning_rate": 3.539521737605256e-07, "loss": 1.3774, "step": 33600 }, { "epoch": 0.92, "learning_rate": 3.5371896707526833e-07, "loss": 1.1401, "step": 33601 }, { "epoch": 0.92, "learning_rate": 3.5348583585797736e-07, "loss": 1.2593, "step": 33602 }, { "epoch": 0.92, "learning_rate": 3.532527801104768e-07, "loss": 1.3135, "step": 33603 }, { "epoch": 0.92, "learning_rate": 3.530197998345908e-07, "loss": 1.2905, "step": 33604 }, { "epoch": 0.92, "learning_rate": 3.5278689503214224e-07, "loss": 1.2417, "step": 33605 }, { "epoch": 0.92, "learning_rate": 3.52554065704952e-07, "loss": 1.313, "step": 33606 }, { "epoch": 0.92, "learning_rate": 3.5232131185484075e-07, "loss": 1.3877, "step": 33607 }, { "epoch": 0.92, "learning_rate": 3.5208863348363267e-07, "loss": 1.2217, "step": 33608 }, { "epoch": 0.92, "learning_rate": 3.518560305931451e-07, "loss": 1.2852, "step": 33609 }, { "epoch": 0.92, "learning_rate": 3.516235031851989e-07, "loss": 1.4019, "step": 33610 }, { "epoch": 0.92, "learning_rate": 3.513910512616148e-07, "loss": 1.4072, "step": 33611 }, { "epoch": 0.92, "learning_rate": 3.5115867482421016e-07, "loss": 1.2275, "step": 33612 }, { "epoch": 0.92, "learning_rate": 3.5092637387480256e-07, "loss": 1.418, "step": 33613 }, { "epoch": 0.92, "learning_rate": 3.5069414841520823e-07, "loss": 1.3511, "step": 33614 }, { "epoch": 0.92, "learning_rate": 3.504619984472468e-07, "loss": 1.2368, "step": 33615 }, { "epoch": 0.92, "learning_rate": 3.502299239727336e-07, "loss": 1.3003, "step": 33616 }, { "epoch": 0.92, "learning_rate": 3.4999792499348264e-07, "loss": 1.3921, "step": 33617 }, { "epoch": 0.92, "learning_rate": 3.4976600151131026e-07, "loss": 1.4006, "step": 33618 }, { "epoch": 0.92, "learning_rate": 3.4953415352803167e-07, "loss": 1.2734, "step": 33619 }, { "epoch": 0.92, "learning_rate": 3.493023810454599e-07, "loss": 1.0635, "step": 33620 }, { "epoch": 0.92, "learning_rate": 3.490706840654079e-07, "loss": 1.2993, "step": 33621 }, { "epoch": 0.92, "learning_rate": 3.488390625896876e-07, "loss": 1.3135, "step": 33622 }, { "epoch": 0.92, "learning_rate": 3.4860751662011307e-07, "loss": 1.3496, "step": 33623 }, { "epoch": 0.92, "learning_rate": 3.4837604615849506e-07, "loss": 1.2913, "step": 33624 }, { "epoch": 0.92, "learning_rate": 3.481446512066433e-07, "loss": 1.3242, "step": 33625 }, { "epoch": 0.92, "learning_rate": 3.4791333176637075e-07, "loss": 1.1924, "step": 33626 }, { "epoch": 0.92, "learning_rate": 3.4768208783948377e-07, "loss": 1.1248, "step": 33627 }, { "epoch": 0.92, "learning_rate": 3.4745091942779643e-07, "loss": 1.2432, "step": 33628 }, { "epoch": 0.92, "learning_rate": 3.472198265331117e-07, "loss": 1.3804, "step": 33629 }, { "epoch": 0.92, "learning_rate": 3.469888091572404e-07, "loss": 1.3833, "step": 33630 }, { "epoch": 0.92, "learning_rate": 3.467578673019889e-07, "loss": 1.1266, "step": 33631 }, { "epoch": 0.92, "learning_rate": 3.4652700096916683e-07, "loss": 1.4314, "step": 33632 }, { "epoch": 0.92, "learning_rate": 3.4629621016057493e-07, "loss": 1.3611, "step": 33633 }, { "epoch": 0.92, "learning_rate": 3.4606549487802396e-07, "loss": 1.4131, "step": 33634 }, { "epoch": 0.92, "learning_rate": 3.4583485512331593e-07, "loss": 1.3367, "step": 33635 }, { "epoch": 0.92, "learning_rate": 3.456042908982582e-07, "loss": 1.2517, "step": 33636 }, { "epoch": 0.92, "learning_rate": 3.4537380220465047e-07, "loss": 1.3025, "step": 33637 }, { "epoch": 0.92, "learning_rate": 3.4514338904430013e-07, "loss": 1.2615, "step": 33638 }, { "epoch": 0.92, "learning_rate": 3.449130514190058e-07, "loss": 1.2329, "step": 33639 }, { "epoch": 0.92, "learning_rate": 3.4468278933057265e-07, "loss": 1.2363, "step": 33640 }, { "epoch": 0.92, "learning_rate": 3.444526027808015e-07, "loss": 1.2754, "step": 33641 }, { "epoch": 0.92, "learning_rate": 3.4422249177149204e-07, "loss": 1.3284, "step": 33642 }, { "epoch": 0.92, "learning_rate": 3.439924563044461e-07, "loss": 1.1978, "step": 33643 }, { "epoch": 0.92, "learning_rate": 3.437624963814623e-07, "loss": 1.2458, "step": 33644 }, { "epoch": 0.92, "learning_rate": 3.435326120043403e-07, "loss": 1.1851, "step": 33645 }, { "epoch": 0.92, "learning_rate": 3.4330280317487754e-07, "loss": 1.2822, "step": 33646 }, { "epoch": 0.92, "learning_rate": 3.4307306989487366e-07, "loss": 1.2656, "step": 33647 }, { "epoch": 0.92, "learning_rate": 3.4284341216612503e-07, "loss": 1.1528, "step": 33648 }, { "epoch": 0.92, "learning_rate": 3.4261382999042804e-07, "loss": 1.147, "step": 33649 }, { "epoch": 0.92, "learning_rate": 3.4238432336957894e-07, "loss": 1.1924, "step": 33650 }, { "epoch": 0.92, "learning_rate": 3.421548923053741e-07, "loss": 1.2805, "step": 33651 }, { "epoch": 0.92, "learning_rate": 3.4192553679960773e-07, "loss": 1.123, "step": 33652 }, { "epoch": 0.92, "learning_rate": 3.4169625685407493e-07, "loss": 1.708, "step": 33653 }, { "epoch": 0.92, "learning_rate": 3.4146705247056767e-07, "loss": 1.2058, "step": 33654 }, { "epoch": 0.92, "learning_rate": 3.412379236508823e-07, "loss": 1.2158, "step": 33655 }, { "epoch": 0.92, "learning_rate": 3.410088703968084e-07, "loss": 1.2063, "step": 33656 }, { "epoch": 0.92, "learning_rate": 3.40779892710138e-07, "loss": 1.1313, "step": 33657 }, { "epoch": 0.92, "learning_rate": 3.4055099059266515e-07, "loss": 1.187, "step": 33658 }, { "epoch": 0.92, "learning_rate": 3.403221640461796e-07, "loss": 1.1523, "step": 33659 }, { "epoch": 0.92, "learning_rate": 3.400934130724709e-07, "loss": 1.2931, "step": 33660 }, { "epoch": 0.92, "learning_rate": 3.398647376733277e-07, "loss": 1.239, "step": 33661 }, { "epoch": 0.92, "learning_rate": 3.3963613785054083e-07, "loss": 1.3003, "step": 33662 }, { "epoch": 0.92, "learning_rate": 3.394076136058988e-07, "loss": 1.3691, "step": 33663 }, { "epoch": 0.92, "learning_rate": 3.3917916494118906e-07, "loss": 1.2905, "step": 33664 }, { "epoch": 0.92, "learning_rate": 3.389507918581969e-07, "loss": 1.2644, "step": 33665 }, { "epoch": 0.92, "learning_rate": 3.3872249435871194e-07, "loss": 1.3022, "step": 33666 }, { "epoch": 0.92, "learning_rate": 3.384942724445195e-07, "loss": 1.377, "step": 33667 }, { "epoch": 0.92, "learning_rate": 3.3826612611740475e-07, "loss": 1.4092, "step": 33668 }, { "epoch": 0.92, "learning_rate": 3.380380553791518e-07, "loss": 1.1462, "step": 33669 }, { "epoch": 0.92, "learning_rate": 3.3781006023154597e-07, "loss": 1.1482, "step": 33670 }, { "epoch": 0.92, "learning_rate": 3.375821406763713e-07, "loss": 1.2004, "step": 33671 }, { "epoch": 0.92, "learning_rate": 3.3735429671540975e-07, "loss": 1.2126, "step": 33672 }, { "epoch": 0.92, "learning_rate": 3.371265283504443e-07, "loss": 1.0513, "step": 33673 }, { "epoch": 0.92, "learning_rate": 3.36898835583257e-07, "loss": 1.1096, "step": 33674 }, { "epoch": 0.92, "learning_rate": 3.366712184156318e-07, "loss": 1.0355, "step": 33675 }, { "epoch": 0.92, "learning_rate": 3.36443676849344e-07, "loss": 1.2505, "step": 33676 }, { "epoch": 0.92, "learning_rate": 3.362162108861777e-07, "loss": 1.1794, "step": 33677 }, { "epoch": 0.92, "learning_rate": 3.3598882052791047e-07, "loss": 1.1755, "step": 33678 }, { "epoch": 0.92, "learning_rate": 3.357615057763253e-07, "loss": 1.3325, "step": 33679 }, { "epoch": 0.92, "learning_rate": 3.355342666331951e-07, "loss": 1.3691, "step": 33680 }, { "epoch": 0.92, "learning_rate": 3.353071031003008e-07, "loss": 1.2463, "step": 33681 }, { "epoch": 0.92, "learning_rate": 3.350800151794187e-07, "loss": 1.2986, "step": 33682 }, { "epoch": 0.92, "learning_rate": 3.3485300287232625e-07, "loss": 1.2577, "step": 33683 }, { "epoch": 0.92, "learning_rate": 3.3462606618079987e-07, "loss": 1.3308, "step": 33684 }, { "epoch": 0.92, "learning_rate": 3.343992051066136e-07, "loss": 1.1445, "step": 33685 }, { "epoch": 0.92, "learning_rate": 3.341724196515417e-07, "loss": 1.1233, "step": 33686 }, { "epoch": 0.92, "learning_rate": 3.3394570981736154e-07, "loss": 1.342, "step": 33687 }, { "epoch": 0.92, "learning_rate": 3.3371907560584395e-07, "loss": 1.2512, "step": 33688 }, { "epoch": 0.92, "learning_rate": 3.3349251701876197e-07, "loss": 1.1921, "step": 33689 }, { "epoch": 0.92, "learning_rate": 3.332660340578897e-07, "loss": 1.2166, "step": 33690 }, { "epoch": 0.92, "learning_rate": 3.330396267249991e-07, "loss": 1.2578, "step": 33691 }, { "epoch": 0.92, "learning_rate": 3.32813295021861e-07, "loss": 1.1404, "step": 33692 }, { "epoch": 0.92, "learning_rate": 3.325870389502439e-07, "loss": 1.0703, "step": 33693 }, { "epoch": 0.92, "learning_rate": 3.323608585119209e-07, "loss": 1.0674, "step": 33694 }, { "epoch": 0.92, "learning_rate": 3.321347537086617e-07, "loss": 1.1753, "step": 33695 }, { "epoch": 0.92, "learning_rate": 3.319087245422326e-07, "loss": 1.2585, "step": 33696 }, { "epoch": 0.92, "learning_rate": 3.316827710144033e-07, "loss": 1.145, "step": 33697 }, { "epoch": 0.92, "learning_rate": 3.314568931269424e-07, "loss": 1.323, "step": 33698 }, { "epoch": 0.92, "learning_rate": 3.312310908816163e-07, "loss": 1.2004, "step": 33699 }, { "epoch": 0.92, "learning_rate": 3.3100536428019137e-07, "loss": 1.2639, "step": 33700 }, { "epoch": 0.92, "learning_rate": 3.307797133244328e-07, "loss": 1.2842, "step": 33701 }, { "epoch": 0.92, "learning_rate": 3.3055413801610817e-07, "loss": 1.2327, "step": 33702 }, { "epoch": 0.92, "learning_rate": 3.3032863835698146e-07, "loss": 1.261, "step": 33703 }, { "epoch": 0.92, "learning_rate": 3.3010321434881477e-07, "loss": 1.2524, "step": 33704 }, { "epoch": 0.92, "learning_rate": 3.298778659933743e-07, "loss": 1.2708, "step": 33705 }, { "epoch": 0.92, "learning_rate": 3.296525932924233e-07, "loss": 1.385, "step": 33706 }, { "epoch": 0.92, "learning_rate": 3.2942739624772234e-07, "loss": 1.2866, "step": 33707 }, { "epoch": 0.92, "learning_rate": 3.292022748610324e-07, "loss": 1.2009, "step": 33708 }, { "epoch": 0.92, "learning_rate": 3.2897722913411753e-07, "loss": 1.1936, "step": 33709 }, { "epoch": 0.92, "learning_rate": 3.2875225906873865e-07, "loss": 1.2092, "step": 33710 }, { "epoch": 0.92, "learning_rate": 3.2852736466665316e-07, "loss": 1.2373, "step": 33711 }, { "epoch": 0.92, "learning_rate": 3.2830254592962074e-07, "loss": 1.3269, "step": 33712 }, { "epoch": 0.92, "learning_rate": 3.2807780285940225e-07, "loss": 1.2649, "step": 33713 }, { "epoch": 0.92, "learning_rate": 3.278531354577541e-07, "loss": 1.2888, "step": 33714 }, { "epoch": 0.92, "learning_rate": 3.2762854372643704e-07, "loss": 1.1638, "step": 33715 }, { "epoch": 0.92, "learning_rate": 3.274040276672041e-07, "loss": 1.2441, "step": 33716 }, { "epoch": 0.92, "learning_rate": 3.2717958728181287e-07, "loss": 1.1812, "step": 33717 }, { "epoch": 0.92, "learning_rate": 3.2695522257202183e-07, "loss": 1.1831, "step": 33718 }, { "epoch": 0.92, "learning_rate": 3.267309335395841e-07, "loss": 1.272, "step": 33719 }, { "epoch": 0.92, "learning_rate": 3.2650672018625486e-07, "loss": 1.248, "step": 33720 }, { "epoch": 0.92, "learning_rate": 3.262825825137872e-07, "loss": 1.3857, "step": 33721 }, { "epoch": 0.92, "learning_rate": 3.260585205239375e-07, "loss": 1.3708, "step": 33722 }, { "epoch": 0.92, "learning_rate": 3.2583453421845656e-07, "loss": 1.2483, "step": 33723 }, { "epoch": 0.92, "learning_rate": 3.2561062359909634e-07, "loss": 1.3115, "step": 33724 }, { "epoch": 0.92, "learning_rate": 3.2538678866760985e-07, "loss": 1.1675, "step": 33725 }, { "epoch": 0.92, "learning_rate": 3.2516302942574794e-07, "loss": 1.1357, "step": 33726 }, { "epoch": 0.92, "learning_rate": 3.249393458752603e-07, "loss": 1.1672, "step": 33727 }, { "epoch": 0.92, "learning_rate": 3.2471573801789893e-07, "loss": 1.3091, "step": 33728 }, { "epoch": 0.92, "learning_rate": 3.2449220585541007e-07, "loss": 1.3518, "step": 33729 }, { "epoch": 0.92, "learning_rate": 3.242687493895458e-07, "loss": 1.1741, "step": 33730 }, { "epoch": 0.92, "learning_rate": 3.240453686220535e-07, "loss": 1.7539, "step": 33731 }, { "epoch": 0.92, "learning_rate": 3.238220635546796e-07, "loss": 1.2991, "step": 33732 }, { "epoch": 0.92, "learning_rate": 3.235988341891716e-07, "loss": 1.301, "step": 33733 }, { "epoch": 0.92, "learning_rate": 3.2337568052727587e-07, "loss": 1.4502, "step": 33734 }, { "epoch": 0.92, "learning_rate": 3.231526025707399e-07, "loss": 1.1958, "step": 33735 }, { "epoch": 0.92, "learning_rate": 3.229296003213056e-07, "loss": 1.0894, "step": 33736 }, { "epoch": 0.92, "learning_rate": 3.227066737807216e-07, "loss": 1.3447, "step": 33737 }, { "epoch": 0.92, "learning_rate": 3.224838229507288e-07, "loss": 1.3792, "step": 33738 }, { "epoch": 0.92, "learning_rate": 3.222610478330723e-07, "loss": 1.4094, "step": 33739 }, { "epoch": 0.92, "learning_rate": 3.2203834842949423e-07, "loss": 1.3303, "step": 33740 }, { "epoch": 0.92, "learning_rate": 3.218157247417375e-07, "loss": 1.3347, "step": 33741 }, { "epoch": 0.92, "learning_rate": 3.215931767715441e-07, "loss": 1.2859, "step": 33742 }, { "epoch": 0.92, "learning_rate": 3.2137070452065377e-07, "loss": 1.2759, "step": 33743 }, { "epoch": 0.92, "learning_rate": 3.211483079908073e-07, "loss": 1.0691, "step": 33744 }, { "epoch": 0.92, "learning_rate": 3.209259871837467e-07, "loss": 1.2876, "step": 33745 }, { "epoch": 0.92, "learning_rate": 3.2070374210120935e-07, "loss": 1.144, "step": 33746 }, { "epoch": 0.92, "learning_rate": 3.20481572744934e-07, "loss": 1.3396, "step": 33747 }, { "epoch": 0.92, "learning_rate": 3.202594791166591e-07, "loss": 1.2322, "step": 33748 }, { "epoch": 0.92, "learning_rate": 3.200374612181212e-07, "loss": 1.3569, "step": 33749 }, { "epoch": 0.92, "learning_rate": 3.19815519051061e-07, "loss": 1.1249, "step": 33750 }, { "epoch": 0.92, "learning_rate": 3.1959365261721055e-07, "loss": 1.3767, "step": 33751 }, { "epoch": 0.92, "learning_rate": 3.193718619183073e-07, "loss": 1.3271, "step": 33752 }, { "epoch": 0.92, "learning_rate": 3.191501469560865e-07, "loss": 1.2598, "step": 33753 }, { "epoch": 0.92, "learning_rate": 3.1892850773228343e-07, "loss": 1.2334, "step": 33754 }, { "epoch": 0.92, "learning_rate": 3.187069442486301e-07, "loss": 1.2373, "step": 33755 }, { "epoch": 0.92, "learning_rate": 3.184854565068629e-07, "loss": 1.2043, "step": 33756 }, { "epoch": 0.92, "learning_rate": 3.182640445087104e-07, "loss": 1.3459, "step": 33757 }, { "epoch": 0.92, "learning_rate": 3.180427082559112e-07, "loss": 1.26, "step": 33758 }, { "epoch": 0.92, "learning_rate": 3.1782144775018953e-07, "loss": 1.2942, "step": 33759 }, { "epoch": 0.92, "learning_rate": 3.1760026299328174e-07, "loss": 1.3843, "step": 33760 }, { "epoch": 0.92, "learning_rate": 3.173791539869153e-07, "loss": 1.3032, "step": 33761 }, { "epoch": 0.92, "learning_rate": 3.171581207328234e-07, "loss": 1.3008, "step": 33762 }, { "epoch": 0.92, "learning_rate": 3.1693716323273004e-07, "loss": 1.171, "step": 33763 }, { "epoch": 0.92, "learning_rate": 3.1671628148836844e-07, "loss": 1.1169, "step": 33764 }, { "epoch": 0.92, "learning_rate": 3.1649547550146596e-07, "loss": 1.1672, "step": 33765 }, { "epoch": 0.92, "learning_rate": 3.162747452737491e-07, "loss": 1.2949, "step": 33766 }, { "epoch": 0.92, "learning_rate": 3.1605409080694535e-07, "loss": 1.3562, "step": 33767 }, { "epoch": 0.92, "learning_rate": 3.158335121027789e-07, "loss": 1.2046, "step": 33768 }, { "epoch": 0.92, "learning_rate": 3.156130091629794e-07, "loss": 1.1663, "step": 33769 }, { "epoch": 0.92, "learning_rate": 3.153925819892689e-07, "loss": 1.2971, "step": 33770 }, { "epoch": 0.92, "learning_rate": 3.1517223058337263e-07, "loss": 1.353, "step": 33771 }, { "epoch": 0.92, "learning_rate": 3.149519549470148e-07, "loss": 1.8345, "step": 33772 }, { "epoch": 0.92, "learning_rate": 3.1473175508191844e-07, "loss": 1.2502, "step": 33773 }, { "epoch": 0.92, "learning_rate": 3.145116309898078e-07, "loss": 1.3804, "step": 33774 }, { "epoch": 0.92, "learning_rate": 3.1429158267240245e-07, "loss": 1.2915, "step": 33775 }, { "epoch": 0.92, "learning_rate": 3.140716101314256e-07, "loss": 1.2842, "step": 33776 }, { "epoch": 0.92, "learning_rate": 3.1385171336859696e-07, "loss": 1.3105, "step": 33777 }, { "epoch": 0.92, "learning_rate": 3.136318923856396e-07, "loss": 1.3201, "step": 33778 }, { "epoch": 0.92, "learning_rate": 3.1341214718426885e-07, "loss": 1.2512, "step": 33779 }, { "epoch": 0.92, "learning_rate": 3.1319247776620875e-07, "loss": 1.7114, "step": 33780 }, { "epoch": 0.92, "learning_rate": 3.129728841331758e-07, "loss": 1.2219, "step": 33781 }, { "epoch": 0.92, "learning_rate": 3.127533662868865e-07, "loss": 1.3789, "step": 33782 }, { "epoch": 0.92, "learning_rate": 3.1253392422905926e-07, "loss": 1.1006, "step": 33783 }, { "epoch": 0.92, "learning_rate": 3.1231455796141287e-07, "loss": 1.4004, "step": 33784 }, { "epoch": 0.92, "learning_rate": 3.1209526748566146e-07, "loss": 1.2754, "step": 33785 }, { "epoch": 0.92, "learning_rate": 3.118760528035214e-07, "loss": 1.175, "step": 33786 }, { "epoch": 0.92, "learning_rate": 3.1165691391670585e-07, "loss": 1.3474, "step": 33787 }, { "epoch": 0.92, "learning_rate": 3.1143785082693224e-07, "loss": 1.2686, "step": 33788 }, { "epoch": 0.92, "learning_rate": 3.1121886353591257e-07, "loss": 1.1326, "step": 33789 }, { "epoch": 0.92, "learning_rate": 3.1099995204535994e-07, "loss": 1.25, "step": 33790 }, { "epoch": 0.92, "learning_rate": 3.107811163569874e-07, "loss": 1.3315, "step": 33791 }, { "epoch": 0.92, "learning_rate": 3.105623564725091e-07, "loss": 1.2361, "step": 33792 }, { "epoch": 0.92, "learning_rate": 3.103436723936337e-07, "loss": 1.2781, "step": 33793 }, { "epoch": 0.92, "learning_rate": 3.101250641220732e-07, "loss": 1.3381, "step": 33794 }, { "epoch": 0.92, "learning_rate": 3.0990653165953624e-07, "loss": 1.2583, "step": 33795 }, { "epoch": 0.92, "learning_rate": 3.096880750077336e-07, "loss": 1.1582, "step": 33796 }, { "epoch": 0.92, "learning_rate": 3.094696941683784e-07, "loss": 1.1982, "step": 33797 }, { "epoch": 0.92, "learning_rate": 3.0925138914317255e-07, "loss": 1.3423, "step": 33798 }, { "epoch": 0.92, "learning_rate": 3.0903315993382696e-07, "loss": 1.3257, "step": 33799 }, { "epoch": 0.92, "learning_rate": 3.0881500654204923e-07, "loss": 1.3604, "step": 33800 }, { "epoch": 0.92, "learning_rate": 3.0859692896954787e-07, "loss": 1.2722, "step": 33801 }, { "epoch": 0.92, "learning_rate": 3.083789272180238e-07, "loss": 1.0957, "step": 33802 }, { "epoch": 0.92, "learning_rate": 3.081610012891878e-07, "loss": 1.292, "step": 33803 }, { "epoch": 0.92, "learning_rate": 3.0794315118474084e-07, "loss": 1.334, "step": 33804 }, { "epoch": 0.92, "learning_rate": 3.077253769063915e-07, "loss": 1.0486, "step": 33805 }, { "epoch": 0.92, "learning_rate": 3.075076784558395e-07, "loss": 1.3787, "step": 33806 }, { "epoch": 0.92, "learning_rate": 3.0729005583479023e-07, "loss": 1.3809, "step": 33807 }, { "epoch": 0.92, "learning_rate": 3.070725090449456e-07, "loss": 1.2368, "step": 33808 }, { "epoch": 0.92, "learning_rate": 3.0685503808800866e-07, "loss": 1.1724, "step": 33809 }, { "epoch": 0.92, "learning_rate": 3.066376429656781e-07, "loss": 1.3303, "step": 33810 }, { "epoch": 0.92, "learning_rate": 3.0642032367965703e-07, "loss": 1.1255, "step": 33811 }, { "epoch": 0.92, "learning_rate": 3.062030802316451e-07, "loss": 1.2798, "step": 33812 }, { "epoch": 0.92, "learning_rate": 3.059859126233433e-07, "loss": 1.3672, "step": 33813 }, { "epoch": 0.92, "learning_rate": 3.05768820856448e-07, "loss": 1.2451, "step": 33814 }, { "epoch": 0.92, "learning_rate": 3.055518049326589e-07, "loss": 1.2166, "step": 33815 }, { "epoch": 0.92, "learning_rate": 3.053348648536736e-07, "loss": 1.2776, "step": 33816 }, { "epoch": 0.92, "learning_rate": 3.051180006211907e-07, "loss": 1.3245, "step": 33817 }, { "epoch": 0.92, "learning_rate": 3.049012122369055e-07, "loss": 1.1477, "step": 33818 }, { "epoch": 0.92, "learning_rate": 3.0468449970251336e-07, "loss": 1.2654, "step": 33819 }, { "epoch": 0.92, "learning_rate": 3.0446786301971067e-07, "loss": 1.261, "step": 33820 }, { "epoch": 0.92, "learning_rate": 3.042513021901927e-07, "loss": 1.1033, "step": 33821 }, { "epoch": 0.92, "learning_rate": 3.0403481721565375e-07, "loss": 1.134, "step": 33822 }, { "epoch": 0.92, "learning_rate": 3.0381840809778574e-07, "loss": 1.2046, "step": 33823 }, { "epoch": 0.92, "learning_rate": 3.0360207483828394e-07, "loss": 1.2747, "step": 33824 }, { "epoch": 0.92, "learning_rate": 3.0338581743884045e-07, "loss": 1.2329, "step": 33825 }, { "epoch": 0.92, "learning_rate": 3.03169635901146e-07, "loss": 1.366, "step": 33826 }, { "epoch": 0.92, "learning_rate": 3.0295353022689264e-07, "loss": 1.3267, "step": 33827 }, { "epoch": 0.92, "learning_rate": 3.0273750041777127e-07, "loss": 1.1147, "step": 33828 }, { "epoch": 0.92, "learning_rate": 3.025215464754716e-07, "loss": 1.0793, "step": 33829 }, { "epoch": 0.92, "learning_rate": 3.023056684016823e-07, "loss": 1.2053, "step": 33830 }, { "epoch": 0.92, "learning_rate": 3.0208986619809424e-07, "loss": 1.2209, "step": 33831 }, { "epoch": 0.92, "learning_rate": 3.018741398663949e-07, "loss": 1.2532, "step": 33832 }, { "epoch": 0.92, "learning_rate": 3.0165848940827193e-07, "loss": 1.2263, "step": 33833 }, { "epoch": 0.92, "learning_rate": 3.0144291482541054e-07, "loss": 1.1973, "step": 33834 }, { "epoch": 0.92, "learning_rate": 3.012274161195017e-07, "loss": 1.302, "step": 33835 }, { "epoch": 0.92, "learning_rate": 3.0101199329222843e-07, "loss": 1.4385, "step": 33836 }, { "epoch": 0.92, "learning_rate": 3.0079664634527604e-07, "loss": 1.3115, "step": 33837 }, { "epoch": 0.92, "learning_rate": 3.005813752803288e-07, "loss": 1.2207, "step": 33838 }, { "epoch": 0.92, "learning_rate": 3.0036618009907315e-07, "loss": 1.73, "step": 33839 }, { "epoch": 0.92, "learning_rate": 3.0015106080319214e-07, "loss": 1.334, "step": 33840 }, { "epoch": 0.92, "learning_rate": 2.999360173943655e-07, "loss": 1.2668, "step": 33841 }, { "epoch": 0.92, "learning_rate": 2.9972104987428087e-07, "loss": 1.1951, "step": 33842 }, { "epoch": 0.92, "learning_rate": 2.995061582446146e-07, "loss": 1.2029, "step": 33843 }, { "epoch": 0.92, "learning_rate": 2.992913425070543e-07, "loss": 1.2163, "step": 33844 }, { "epoch": 0.92, "learning_rate": 2.990766026632741e-07, "loss": 1.2871, "step": 33845 }, { "epoch": 0.92, "learning_rate": 2.988619387149583e-07, "loss": 1.4392, "step": 33846 }, { "epoch": 0.92, "learning_rate": 2.9864735066378326e-07, "loss": 1.0935, "step": 33847 }, { "epoch": 0.92, "learning_rate": 2.984328385114321e-07, "loss": 1.1702, "step": 33848 }, { "epoch": 0.92, "learning_rate": 2.9821840225957796e-07, "loss": 1.0967, "step": 33849 }, { "epoch": 0.92, "learning_rate": 2.9800404190990173e-07, "loss": 1.182, "step": 33850 }, { "epoch": 0.92, "learning_rate": 2.977897574640787e-07, "loss": 1.2559, "step": 33851 }, { "epoch": 0.92, "learning_rate": 2.975755489237886e-07, "loss": 1.3035, "step": 33852 }, { "epoch": 0.92, "learning_rate": 2.9736141629070347e-07, "loss": 1.2175, "step": 33853 }, { "epoch": 0.92, "learning_rate": 2.9714735956650086e-07, "loss": 1.1729, "step": 33854 }, { "epoch": 0.92, "learning_rate": 2.9693337875285275e-07, "loss": 1.3342, "step": 33855 }, { "epoch": 0.92, "learning_rate": 2.9671947385143897e-07, "loss": 1.6577, "step": 33856 }, { "epoch": 0.92, "learning_rate": 2.965056448639259e-07, "loss": 1.2671, "step": 33857 }, { "epoch": 0.92, "learning_rate": 2.9629189179198993e-07, "loss": 1.2727, "step": 33858 }, { "epoch": 0.92, "learning_rate": 2.960782146373042e-07, "loss": 1.1245, "step": 33859 }, { "epoch": 0.92, "learning_rate": 2.9586461340153974e-07, "loss": 1.281, "step": 33860 }, { "epoch": 0.92, "learning_rate": 2.9565108808636724e-07, "loss": 1.1963, "step": 33861 }, { "epoch": 0.92, "learning_rate": 2.9543763869345546e-07, "loss": 1.3401, "step": 33862 }, { "epoch": 0.92, "learning_rate": 2.9522426522447853e-07, "loss": 1.7107, "step": 33863 }, { "epoch": 0.92, "learning_rate": 2.9501096768110306e-07, "loss": 1.1714, "step": 33864 }, { "epoch": 0.92, "learning_rate": 2.9479774606499755e-07, "loss": 1.1895, "step": 33865 }, { "epoch": 0.92, "learning_rate": 2.945846003778308e-07, "loss": 1.0621, "step": 33866 }, { "epoch": 0.92, "learning_rate": 2.9437153062127024e-07, "loss": 1.0574, "step": 33867 }, { "epoch": 0.92, "learning_rate": 2.941585367969835e-07, "loss": 1.4062, "step": 33868 }, { "epoch": 0.92, "learning_rate": 2.9394561890663584e-07, "loss": 1.1445, "step": 33869 }, { "epoch": 0.92, "learning_rate": 2.9373277695189386e-07, "loss": 1.3186, "step": 33870 }, { "epoch": 0.92, "learning_rate": 2.9352001093442163e-07, "loss": 1.1162, "step": 33871 }, { "epoch": 0.93, "learning_rate": 2.9330732085588565e-07, "loss": 1.2554, "step": 33872 }, { "epoch": 0.93, "learning_rate": 2.9309470671794794e-07, "loss": 1.3616, "step": 33873 }, { "epoch": 0.93, "learning_rate": 2.9288216852227267e-07, "loss": 1.2532, "step": 33874 }, { "epoch": 0.93, "learning_rate": 2.9266970627052414e-07, "loss": 1.2717, "step": 33875 }, { "epoch": 0.93, "learning_rate": 2.9245731996436213e-07, "loss": 1.7407, "step": 33876 }, { "epoch": 0.93, "learning_rate": 2.9224500960544855e-07, "loss": 1.3179, "step": 33877 }, { "epoch": 0.93, "learning_rate": 2.920327751954455e-07, "loss": 1.3147, "step": 33878 }, { "epoch": 0.93, "learning_rate": 2.918206167360138e-07, "loss": 1.1936, "step": 33879 }, { "epoch": 0.93, "learning_rate": 2.9160853422881216e-07, "loss": 1.2659, "step": 33880 }, { "epoch": 0.93, "learning_rate": 2.9139652767549933e-07, "loss": 1.3401, "step": 33881 }, { "epoch": 0.93, "learning_rate": 2.9118459707773607e-07, "loss": 1.4297, "step": 33882 }, { "epoch": 0.93, "learning_rate": 2.9097274243717886e-07, "loss": 1.3379, "step": 33883 }, { "epoch": 0.93, "learning_rate": 2.9076096375548535e-07, "loss": 1.2375, "step": 33884 }, { "epoch": 0.93, "learning_rate": 2.905492610343108e-07, "loss": 1.1924, "step": 33885 }, { "epoch": 0.93, "learning_rate": 2.90337634275315e-07, "loss": 1.1052, "step": 33886 }, { "epoch": 0.93, "learning_rate": 2.9012608348015116e-07, "loss": 1.0994, "step": 33887 }, { "epoch": 0.93, "learning_rate": 2.8991460865047447e-07, "loss": 1.3433, "step": 33888 }, { "epoch": 0.93, "learning_rate": 2.8970320978794044e-07, "loss": 1.199, "step": 33889 }, { "epoch": 0.93, "learning_rate": 2.894918868942009e-07, "loss": 1.4712, "step": 33890 }, { "epoch": 0.93, "learning_rate": 2.892806399709136e-07, "loss": 1.166, "step": 33891 }, { "epoch": 0.93, "learning_rate": 2.89069469019726e-07, "loss": 1.1982, "step": 33892 }, { "epoch": 0.93, "learning_rate": 2.8885837404229345e-07, "loss": 1.2419, "step": 33893 }, { "epoch": 0.93, "learning_rate": 2.8864735504026574e-07, "loss": 1.3569, "step": 33894 }, { "epoch": 0.93, "learning_rate": 2.8843641201529605e-07, "loss": 1.2537, "step": 33895 }, { "epoch": 0.93, "learning_rate": 2.8822554496903186e-07, "loss": 1.2878, "step": 33896 }, { "epoch": 0.93, "learning_rate": 2.880147539031242e-07, "loss": 1.344, "step": 33897 }, { "epoch": 0.93, "learning_rate": 2.878040388192216e-07, "loss": 1.2388, "step": 33898 }, { "epoch": 0.93, "learning_rate": 2.8759339971897617e-07, "loss": 1.1963, "step": 33899 }, { "epoch": 0.93, "learning_rate": 2.873828366040299e-07, "loss": 1.3188, "step": 33900 }, { "epoch": 0.93, "learning_rate": 2.871723494760337e-07, "loss": 1.1514, "step": 33901 }, { "epoch": 0.93, "learning_rate": 2.86961938336634e-07, "loss": 1.2961, "step": 33902 }, { "epoch": 0.93, "learning_rate": 2.867516031874773e-07, "loss": 1.2903, "step": 33903 }, { "epoch": 0.93, "learning_rate": 2.865413440302078e-07, "loss": 1.2954, "step": 33904 }, { "epoch": 0.93, "learning_rate": 2.8633116086647095e-07, "loss": 1.302, "step": 33905 }, { "epoch": 0.93, "learning_rate": 2.86121053697912e-07, "loss": 1.0957, "step": 33906 }, { "epoch": 0.93, "learning_rate": 2.859110225261741e-07, "loss": 1.2576, "step": 33907 }, { "epoch": 0.93, "learning_rate": 2.857010673529015e-07, "loss": 1.2971, "step": 33908 }, { "epoch": 0.93, "learning_rate": 2.854911881797329e-07, "loss": 1.6499, "step": 33909 }, { "epoch": 0.93, "learning_rate": 2.852813850083158e-07, "loss": 1.2512, "step": 33910 }, { "epoch": 0.93, "learning_rate": 2.850716578402879e-07, "loss": 1.2295, "step": 33911 }, { "epoch": 0.93, "learning_rate": 2.8486200667729225e-07, "loss": 1.2229, "step": 33912 }, { "epoch": 0.93, "learning_rate": 2.846524315209664e-07, "loss": 1.2537, "step": 33913 }, { "epoch": 0.93, "learning_rate": 2.844429323729514e-07, "loss": 1.1917, "step": 33914 }, { "epoch": 0.93, "learning_rate": 2.8423350923488803e-07, "loss": 1.3364, "step": 33915 }, { "epoch": 0.93, "learning_rate": 2.840241621084117e-07, "loss": 1.2847, "step": 33916 }, { "epoch": 0.93, "learning_rate": 2.83814890995161e-07, "loss": 1.2551, "step": 33917 }, { "epoch": 0.93, "learning_rate": 2.836056958967748e-07, "loss": 1.1206, "step": 33918 }, { "epoch": 0.93, "learning_rate": 2.833965768148883e-07, "loss": 1.1072, "step": 33919 }, { "epoch": 0.93, "learning_rate": 2.8318753375113694e-07, "loss": 1.1936, "step": 33920 }, { "epoch": 0.93, "learning_rate": 2.829785667071594e-07, "loss": 1.1807, "step": 33921 }, { "epoch": 0.93, "learning_rate": 2.8276967568458656e-07, "loss": 1.1921, "step": 33922 }, { "epoch": 0.93, "learning_rate": 2.8256086068505495e-07, "loss": 1.3091, "step": 33923 }, { "epoch": 0.93, "learning_rate": 2.8235212171019763e-07, "loss": 1.2556, "step": 33924 }, { "epoch": 0.93, "learning_rate": 2.8214345876164785e-07, "loss": 1.2522, "step": 33925 }, { "epoch": 0.93, "learning_rate": 2.819348718410386e-07, "loss": 1.2778, "step": 33926 }, { "epoch": 0.93, "learning_rate": 2.817263609499998e-07, "loss": 1.2869, "step": 33927 }, { "epoch": 0.93, "learning_rate": 2.815179260901646e-07, "loss": 1.2544, "step": 33928 }, { "epoch": 0.93, "learning_rate": 2.813095672631638e-07, "loss": 1.2578, "step": 33929 }, { "epoch": 0.93, "learning_rate": 2.811012844706262e-07, "loss": 1.1047, "step": 33930 }, { "epoch": 0.93, "learning_rate": 2.808930777141827e-07, "loss": 1.3792, "step": 33931 }, { "epoch": 0.93, "learning_rate": 2.806849469954598e-07, "loss": 1.0479, "step": 33932 }, { "epoch": 0.93, "learning_rate": 2.8047689231608944e-07, "loss": 1.2673, "step": 33933 }, { "epoch": 0.93, "learning_rate": 2.8026891367769707e-07, "loss": 1.3794, "step": 33934 }, { "epoch": 0.93, "learning_rate": 2.800610110819091e-07, "loss": 1.2937, "step": 33935 }, { "epoch": 0.93, "learning_rate": 2.7985318453035424e-07, "loss": 1.179, "step": 33936 }, { "epoch": 0.93, "learning_rate": 2.796454340246568e-07, "loss": 1.1646, "step": 33937 }, { "epoch": 0.93, "learning_rate": 2.794377595664444e-07, "loss": 1.3171, "step": 33938 }, { "epoch": 0.93, "learning_rate": 2.792301611573367e-07, "loss": 1.2732, "step": 33939 }, { "epoch": 0.93, "learning_rate": 2.790226387989636e-07, "loss": 1.1362, "step": 33940 }, { "epoch": 0.93, "learning_rate": 2.78815192492945e-07, "loss": 1.6777, "step": 33941 }, { "epoch": 0.93, "learning_rate": 2.786078222409072e-07, "loss": 1.3499, "step": 33942 }, { "epoch": 0.93, "learning_rate": 2.784005280444679e-07, "loss": 1.2034, "step": 33943 }, { "epoch": 0.93, "learning_rate": 2.781933099052536e-07, "loss": 1.3765, "step": 33944 }, { "epoch": 0.93, "learning_rate": 2.7798616782488074e-07, "loss": 1.3789, "step": 33945 }, { "epoch": 0.93, "learning_rate": 2.777791018049747e-07, "loss": 1.2544, "step": 33946 }, { "epoch": 0.93, "learning_rate": 2.7757211184715307e-07, "loss": 1.3035, "step": 33947 }, { "epoch": 0.93, "learning_rate": 2.773651979530356e-07, "loss": 1.3369, "step": 33948 }, { "epoch": 0.93, "learning_rate": 2.7715836012423894e-07, "loss": 1.1158, "step": 33949 }, { "epoch": 0.93, "learning_rate": 2.7695159836238497e-07, "loss": 1.3284, "step": 33950 }, { "epoch": 0.93, "learning_rate": 2.7674491266909023e-07, "loss": 1.1589, "step": 33951 }, { "epoch": 0.93, "learning_rate": 2.7653830304596895e-07, "loss": 1.2156, "step": 33952 }, { "epoch": 0.93, "learning_rate": 2.7633176949464103e-07, "loss": 1.2699, "step": 33953 }, { "epoch": 0.93, "learning_rate": 2.7612531201672177e-07, "loss": 1.1699, "step": 33954 }, { "epoch": 0.93, "learning_rate": 2.759189306138244e-07, "loss": 1.2053, "step": 33955 }, { "epoch": 0.93, "learning_rate": 2.7571262528756416e-07, "loss": 1.3342, "step": 33956 }, { "epoch": 0.93, "learning_rate": 2.7550639603955656e-07, "loss": 1.3325, "step": 33957 }, { "epoch": 0.93, "learning_rate": 2.7530024287141465e-07, "loss": 1.3547, "step": 33958 }, { "epoch": 0.93, "learning_rate": 2.750941657847506e-07, "loss": 1.2419, "step": 33959 }, { "epoch": 0.93, "learning_rate": 2.748881647811752e-07, "loss": 1.2632, "step": 33960 }, { "epoch": 0.93, "learning_rate": 2.7468223986230394e-07, "loss": 1.197, "step": 33961 }, { "epoch": 0.93, "learning_rate": 2.7447639102974435e-07, "loss": 1.2327, "step": 33962 }, { "epoch": 0.93, "learning_rate": 2.742706182851085e-07, "loss": 1.2893, "step": 33963 }, { "epoch": 0.93, "learning_rate": 2.7406492163000507e-07, "loss": 1.1956, "step": 33964 }, { "epoch": 0.93, "learning_rate": 2.738593010660462e-07, "loss": 1.1316, "step": 33965 }, { "epoch": 0.93, "learning_rate": 2.736537565948372e-07, "loss": 1.3228, "step": 33966 }, { "epoch": 0.93, "learning_rate": 2.7344828821798783e-07, "loss": 1.2734, "step": 33967 }, { "epoch": 0.93, "learning_rate": 2.7324289593710473e-07, "loss": 1.2395, "step": 33968 }, { "epoch": 0.93, "learning_rate": 2.730375797537965e-07, "loss": 1.3047, "step": 33969 }, { "epoch": 0.93, "learning_rate": 2.728323396696686e-07, "loss": 1.3579, "step": 33970 }, { "epoch": 0.93, "learning_rate": 2.726271756863252e-07, "loss": 1.2134, "step": 33971 }, { "epoch": 0.93, "learning_rate": 2.7242208780537296e-07, "loss": 1.3113, "step": 33972 }, { "epoch": 0.93, "learning_rate": 2.7221707602841596e-07, "loss": 1.2966, "step": 33973 }, { "epoch": 0.93, "learning_rate": 2.720121403570597e-07, "loss": 1.3286, "step": 33974 }, { "epoch": 0.93, "learning_rate": 2.7180728079290397e-07, "loss": 1.2769, "step": 33975 }, { "epoch": 0.93, "learning_rate": 2.7160249733755415e-07, "loss": 1.3394, "step": 33976 }, { "epoch": 0.93, "learning_rate": 2.7139778999261126e-07, "loss": 1.3977, "step": 33977 }, { "epoch": 0.93, "learning_rate": 2.7119315875967945e-07, "loss": 1.2979, "step": 33978 }, { "epoch": 0.93, "learning_rate": 2.709886036403553e-07, "loss": 1.2612, "step": 33979 }, { "epoch": 0.93, "learning_rate": 2.7078412463624305e-07, "loss": 1.2822, "step": 33980 }, { "epoch": 0.93, "learning_rate": 2.705797217489392e-07, "loss": 1.3552, "step": 33981 }, { "epoch": 0.93, "learning_rate": 2.7037539498004585e-07, "loss": 1.0969, "step": 33982 }, { "epoch": 0.93, "learning_rate": 2.7017114433116056e-07, "loss": 1.1965, "step": 33983 }, { "epoch": 0.93, "learning_rate": 2.6996696980387873e-07, "loss": 1.3132, "step": 33984 }, { "epoch": 0.93, "learning_rate": 2.697628713998024e-07, "loss": 1.2803, "step": 33985 }, { "epoch": 0.93, "learning_rate": 2.695588491205248e-07, "loss": 1.282, "step": 33986 }, { "epoch": 0.93, "learning_rate": 2.6935490296764346e-07, "loss": 1.1809, "step": 33987 }, { "epoch": 0.93, "learning_rate": 2.691510329427527e-07, "loss": 1.2212, "step": 33988 }, { "epoch": 0.93, "learning_rate": 2.689472390474501e-07, "loss": 1.335, "step": 33989 }, { "epoch": 0.93, "learning_rate": 2.6874352128332783e-07, "loss": 1.2437, "step": 33990 }, { "epoch": 0.93, "learning_rate": 2.6853987965198003e-07, "loss": 1.2478, "step": 33991 }, { "epoch": 0.93, "learning_rate": 2.683363141549988e-07, "loss": 1.1746, "step": 33992 }, { "epoch": 0.93, "learning_rate": 2.681328247939807e-07, "loss": 1.2065, "step": 33993 }, { "epoch": 0.93, "learning_rate": 2.6792941157051446e-07, "loss": 1.4067, "step": 33994 }, { "epoch": 0.93, "learning_rate": 2.677260744861909e-07, "loss": 1.2314, "step": 33995 }, { "epoch": 0.93, "learning_rate": 2.6752281354260225e-07, "loss": 1.6528, "step": 33996 }, { "epoch": 0.93, "learning_rate": 2.6731962874133934e-07, "loss": 1.1016, "step": 33997 }, { "epoch": 0.93, "learning_rate": 2.67116520083992e-07, "loss": 1.1793, "step": 33998 }, { "epoch": 0.93, "learning_rate": 2.6691348757214576e-07, "loss": 1.3137, "step": 33999 }, { "epoch": 0.93, "learning_rate": 2.6671053120739364e-07, "loss": 1.2527, "step": 34000 }, { "epoch": 0.93, "learning_rate": 2.6650765099132117e-07, "loss": 1.2551, "step": 34001 }, { "epoch": 0.93, "learning_rate": 2.6630484692551584e-07, "loss": 1.3215, "step": 34002 }, { "epoch": 0.93, "learning_rate": 2.6610211901156204e-07, "loss": 1.3193, "step": 34003 }, { "epoch": 0.93, "learning_rate": 2.6589946725105066e-07, "loss": 1.2979, "step": 34004 }, { "epoch": 0.93, "learning_rate": 2.656968916455638e-07, "loss": 1.1891, "step": 34005 }, { "epoch": 0.93, "learning_rate": 2.6549439219668796e-07, "loss": 1.3547, "step": 34006 }, { "epoch": 0.93, "learning_rate": 2.652919689060041e-07, "loss": 1.6123, "step": 34007 }, { "epoch": 0.93, "learning_rate": 2.650896217750998e-07, "loss": 1.146, "step": 34008 }, { "epoch": 0.93, "learning_rate": 2.6488735080555714e-07, "loss": 1.3767, "step": 34009 }, { "epoch": 0.93, "learning_rate": 2.646851559989583e-07, "loss": 1.0981, "step": 34010 }, { "epoch": 0.93, "learning_rate": 2.64483037356883e-07, "loss": 1.1677, "step": 34011 }, { "epoch": 0.93, "learning_rate": 2.642809948809144e-07, "loss": 1.1965, "step": 34012 }, { "epoch": 0.93, "learning_rate": 2.6407902857263576e-07, "loss": 1.178, "step": 34013 }, { "epoch": 0.93, "learning_rate": 2.6387713843362364e-07, "loss": 1.3901, "step": 34014 }, { "epoch": 0.93, "learning_rate": 2.6367532446545775e-07, "loss": 1.1951, "step": 34015 }, { "epoch": 0.93, "learning_rate": 2.63473586669718e-07, "loss": 1.2261, "step": 34016 }, { "epoch": 0.93, "learning_rate": 2.6327192504798314e-07, "loss": 1.2312, "step": 34017 }, { "epoch": 0.93, "learning_rate": 2.630703396018297e-07, "loss": 1.2615, "step": 34018 }, { "epoch": 0.93, "learning_rate": 2.6286883033283526e-07, "loss": 1.2703, "step": 34019 }, { "epoch": 0.93, "learning_rate": 2.626673972425764e-07, "loss": 1.3628, "step": 34020 }, { "epoch": 0.93, "learning_rate": 2.6246604033262955e-07, "loss": 1.3586, "step": 34021 }, { "epoch": 0.93, "learning_rate": 2.622647596045691e-07, "loss": 1.3118, "step": 34022 }, { "epoch": 0.93, "learning_rate": 2.620635550599704e-07, "loss": 1.2212, "step": 34023 }, { "epoch": 0.93, "learning_rate": 2.618624267004066e-07, "loss": 1.2937, "step": 34024 }, { "epoch": 0.93, "learning_rate": 2.616613745274532e-07, "loss": 1.3066, "step": 34025 }, { "epoch": 0.93, "learning_rate": 2.6146039854268e-07, "loss": 1.2573, "step": 34026 }, { "epoch": 0.93, "learning_rate": 2.612594987476624e-07, "loss": 1.3667, "step": 34027 }, { "epoch": 0.93, "learning_rate": 2.6105867514397145e-07, "loss": 1.344, "step": 34028 }, { "epoch": 0.93, "learning_rate": 2.6085792773317686e-07, "loss": 1.3386, "step": 34029 }, { "epoch": 0.93, "learning_rate": 2.6065725651685194e-07, "loss": 1.2397, "step": 34030 }, { "epoch": 0.93, "learning_rate": 2.60456661496562e-07, "loss": 1.3123, "step": 34031 }, { "epoch": 0.93, "learning_rate": 2.602561426738814e-07, "loss": 1.2126, "step": 34032 }, { "epoch": 0.93, "learning_rate": 2.6005570005037674e-07, "loss": 1.3345, "step": 34033 }, { "epoch": 0.93, "learning_rate": 2.598553336276166e-07, "loss": 1.353, "step": 34034 }, { "epoch": 0.93, "learning_rate": 2.596550434071665e-07, "loss": 1.0798, "step": 34035 }, { "epoch": 0.93, "learning_rate": 2.594548293905963e-07, "loss": 1.2488, "step": 34036 }, { "epoch": 0.93, "learning_rate": 2.5925469157947135e-07, "loss": 1.1865, "step": 34037 }, { "epoch": 0.93, "learning_rate": 2.590546299753571e-07, "loss": 1.2778, "step": 34038 }, { "epoch": 0.93, "learning_rate": 2.588546445798179e-07, "loss": 1.272, "step": 34039 }, { "epoch": 0.93, "learning_rate": 2.5865473539442023e-07, "loss": 1.2141, "step": 34040 }, { "epoch": 0.93, "learning_rate": 2.5845490242072723e-07, "loss": 1.2463, "step": 34041 }, { "epoch": 0.93, "learning_rate": 2.582551456603022e-07, "loss": 1.2158, "step": 34042 }, { "epoch": 0.93, "learning_rate": 2.5805546511470826e-07, "loss": 1.1392, "step": 34043 }, { "epoch": 0.93, "learning_rate": 2.578558607855064e-07, "loss": 1.2507, "step": 34044 }, { "epoch": 0.93, "learning_rate": 2.576563326742609e-07, "loss": 1.3713, "step": 34045 }, { "epoch": 0.93, "learning_rate": 2.574568807825295e-07, "loss": 1.3638, "step": 34046 }, { "epoch": 0.93, "learning_rate": 2.5725750511187417e-07, "loss": 1.2695, "step": 34047 }, { "epoch": 0.93, "learning_rate": 2.57058205663856e-07, "loss": 1.1919, "step": 34048 }, { "epoch": 0.93, "learning_rate": 2.568589824400325e-07, "loss": 1.3499, "step": 34049 }, { "epoch": 0.93, "learning_rate": 2.566598354419625e-07, "loss": 1.219, "step": 34050 }, { "epoch": 0.93, "learning_rate": 2.564607646712047e-07, "loss": 1.3054, "step": 34051 }, { "epoch": 0.93, "learning_rate": 2.5626177012931573e-07, "loss": 1.25, "step": 34052 }, { "epoch": 0.93, "learning_rate": 2.560628518178532e-07, "loss": 1.1055, "step": 34053 }, { "epoch": 0.93, "learning_rate": 2.5586400973837244e-07, "loss": 1.2974, "step": 34054 }, { "epoch": 0.93, "learning_rate": 2.5566524389243006e-07, "loss": 1.0239, "step": 34055 }, { "epoch": 0.93, "learning_rate": 2.554665542815804e-07, "loss": 1.292, "step": 34056 }, { "epoch": 0.93, "learning_rate": 2.5526794090737883e-07, "loss": 1.1748, "step": 34057 }, { "epoch": 0.93, "learning_rate": 2.5506940377137747e-07, "loss": 1.1978, "step": 34058 }, { "epoch": 0.93, "learning_rate": 2.548709428751306e-07, "loss": 1.322, "step": 34059 }, { "epoch": 0.93, "learning_rate": 2.5467255822019363e-07, "loss": 1.1702, "step": 34060 }, { "epoch": 0.93, "learning_rate": 2.544742498081132e-07, "loss": 1.2737, "step": 34061 }, { "epoch": 0.93, "learning_rate": 2.542760176404446e-07, "loss": 1.314, "step": 34062 }, { "epoch": 0.93, "learning_rate": 2.540778617187378e-07, "loss": 1.345, "step": 34063 }, { "epoch": 0.93, "learning_rate": 2.5387978204454377e-07, "loss": 1.4504, "step": 34064 }, { "epoch": 0.93, "learning_rate": 2.53681778619409e-07, "loss": 1.3486, "step": 34065 }, { "epoch": 0.93, "learning_rate": 2.5348385144488675e-07, "loss": 1.2988, "step": 34066 }, { "epoch": 0.93, "learning_rate": 2.532860005225235e-07, "loss": 1.3628, "step": 34067 }, { "epoch": 0.93, "learning_rate": 2.5308822585386804e-07, "loss": 1.1069, "step": 34068 }, { "epoch": 0.93, "learning_rate": 2.528905274404658e-07, "loss": 1.0957, "step": 34069 }, { "epoch": 0.93, "learning_rate": 2.526929052838645e-07, "loss": 1.1506, "step": 34070 }, { "epoch": 0.93, "learning_rate": 2.5249535938561055e-07, "loss": 1.2695, "step": 34071 }, { "epoch": 0.93, "learning_rate": 2.522978897472506e-07, "loss": 1.2786, "step": 34072 }, { "epoch": 0.93, "learning_rate": 2.5210049637032666e-07, "loss": 1.1943, "step": 34073 }, { "epoch": 0.93, "learning_rate": 2.519031792563853e-07, "loss": 1.2754, "step": 34074 }, { "epoch": 0.93, "learning_rate": 2.517059384069698e-07, "loss": 1.2598, "step": 34075 }, { "epoch": 0.93, "learning_rate": 2.515087738236222e-07, "loss": 1.3308, "step": 34076 }, { "epoch": 0.93, "learning_rate": 2.5131168550788674e-07, "loss": 1.198, "step": 34077 }, { "epoch": 0.93, "learning_rate": 2.5111467346130456e-07, "loss": 1.2825, "step": 34078 }, { "epoch": 0.93, "learning_rate": 2.509177376854166e-07, "loss": 1.2649, "step": 34079 }, { "epoch": 0.93, "learning_rate": 2.507208781817638e-07, "loss": 1.186, "step": 34080 }, { "epoch": 0.93, "learning_rate": 2.5052409495188723e-07, "loss": 1.2561, "step": 34081 }, { "epoch": 0.93, "learning_rate": 2.503273879973245e-07, "loss": 1.321, "step": 34082 }, { "epoch": 0.93, "learning_rate": 2.501307573196166e-07, "loss": 1.2983, "step": 34083 }, { "epoch": 0.93, "learning_rate": 2.4993420292030004e-07, "loss": 1.3066, "step": 34084 }, { "epoch": 0.93, "learning_rate": 2.497377248009147e-07, "loss": 1.3633, "step": 34085 }, { "epoch": 0.93, "learning_rate": 2.4954132296299507e-07, "loss": 1.2878, "step": 34086 }, { "epoch": 0.93, "learning_rate": 2.493449974080797e-07, "loss": 1.4021, "step": 34087 }, { "epoch": 0.93, "learning_rate": 2.491487481377042e-07, "loss": 1.0076, "step": 34088 }, { "epoch": 0.93, "learning_rate": 2.489525751534039e-07, "loss": 1.2168, "step": 34089 }, { "epoch": 0.93, "learning_rate": 2.487564784567131e-07, "loss": 1.1228, "step": 34090 }, { "epoch": 0.93, "learning_rate": 2.485604580491663e-07, "loss": 1.2456, "step": 34091 }, { "epoch": 0.93, "learning_rate": 2.4836451393229766e-07, "loss": 1.2493, "step": 34092 }, { "epoch": 0.93, "learning_rate": 2.4816864610763824e-07, "loss": 1.2292, "step": 34093 }, { "epoch": 0.93, "learning_rate": 2.479728545767224e-07, "loss": 1.7124, "step": 34094 }, { "epoch": 0.93, "learning_rate": 2.4777713934108107e-07, "loss": 1.3047, "step": 34095 }, { "epoch": 0.93, "learning_rate": 2.475815004022464e-07, "loss": 1.2288, "step": 34096 }, { "epoch": 0.93, "learning_rate": 2.47385937761746e-07, "loss": 1.1003, "step": 34097 }, { "epoch": 0.93, "learning_rate": 2.471904514211143e-07, "loss": 1.3364, "step": 34098 }, { "epoch": 0.93, "learning_rate": 2.469950413818778e-07, "loss": 0.9929, "step": 34099 }, { "epoch": 0.93, "learning_rate": 2.4679970764556527e-07, "loss": 1.2979, "step": 34100 }, { "epoch": 0.93, "learning_rate": 2.466044502137055e-07, "loss": 1.281, "step": 34101 }, { "epoch": 0.93, "learning_rate": 2.4640926908782725e-07, "loss": 1.2104, "step": 34102 }, { "epoch": 0.93, "learning_rate": 2.46214164269456e-07, "loss": 1.2976, "step": 34103 }, { "epoch": 0.93, "learning_rate": 2.460191357601183e-07, "loss": 1.2139, "step": 34104 }, { "epoch": 0.93, "learning_rate": 2.4582418356133953e-07, "loss": 1.4856, "step": 34105 }, { "epoch": 0.93, "learning_rate": 2.456293076746452e-07, "loss": 1.283, "step": 34106 }, { "epoch": 0.93, "learning_rate": 2.45434508101563e-07, "loss": 1.3647, "step": 34107 }, { "epoch": 0.93, "learning_rate": 2.452397848436128e-07, "loss": 1.1409, "step": 34108 }, { "epoch": 0.93, "learning_rate": 2.4504513790231887e-07, "loss": 1.3386, "step": 34109 }, { "epoch": 0.93, "learning_rate": 2.448505672792045e-07, "loss": 1.3428, "step": 34110 }, { "epoch": 0.93, "learning_rate": 2.446560729757952e-07, "loss": 1.2949, "step": 34111 }, { "epoch": 0.93, "learning_rate": 2.444616549936063e-07, "loss": 1.2444, "step": 34112 }, { "epoch": 0.93, "learning_rate": 2.4426731333416334e-07, "loss": 1.1836, "step": 34113 }, { "epoch": 0.93, "learning_rate": 2.440730479989839e-07, "loss": 1.7041, "step": 34114 }, { "epoch": 0.93, "learning_rate": 2.438788589895913e-07, "loss": 1.2334, "step": 34115 }, { "epoch": 0.93, "learning_rate": 2.4368474630750206e-07, "loss": 1.2722, "step": 34116 }, { "epoch": 0.93, "learning_rate": 2.434907099542361e-07, "loss": 1.1091, "step": 34117 }, { "epoch": 0.93, "learning_rate": 2.432967499313088e-07, "loss": 1.3657, "step": 34118 }, { "epoch": 0.93, "learning_rate": 2.431028662402435e-07, "loss": 1.153, "step": 34119 }, { "epoch": 0.93, "learning_rate": 2.4290905888255e-07, "loss": 1.1689, "step": 34120 }, { "epoch": 0.93, "learning_rate": 2.427153278597494e-07, "loss": 1.1519, "step": 34121 }, { "epoch": 0.93, "learning_rate": 2.4252167317335594e-07, "loss": 1.1174, "step": 34122 }, { "epoch": 0.93, "learning_rate": 2.423280948248841e-07, "loss": 1.1035, "step": 34123 }, { "epoch": 0.93, "learning_rate": 2.4213459281585027e-07, "loss": 1.2395, "step": 34124 }, { "epoch": 0.93, "learning_rate": 2.419411671477645e-07, "loss": 1.1853, "step": 34125 }, { "epoch": 0.93, "learning_rate": 2.417478178221444e-07, "loss": 1.708, "step": 34126 }, { "epoch": 0.93, "learning_rate": 2.41554544840501e-07, "loss": 1.2239, "step": 34127 }, { "epoch": 0.93, "learning_rate": 2.4136134820434533e-07, "loss": 1.2566, "step": 34128 }, { "epoch": 0.93, "learning_rate": 2.4116822791518835e-07, "loss": 1.2734, "step": 34129 }, { "epoch": 0.93, "learning_rate": 2.4097518397454447e-07, "loss": 1.3435, "step": 34130 }, { "epoch": 0.93, "learning_rate": 2.407822163839202e-07, "loss": 1.1248, "step": 34131 }, { "epoch": 0.93, "learning_rate": 2.405893251448277e-07, "loss": 1.3503, "step": 34132 }, { "epoch": 0.93, "learning_rate": 2.4039651025877465e-07, "loss": 1.2732, "step": 34133 }, { "epoch": 0.93, "learning_rate": 2.402037717272698e-07, "loss": 1.2441, "step": 34134 }, { "epoch": 0.93, "learning_rate": 2.4001110955182205e-07, "loss": 1.2969, "step": 34135 }, { "epoch": 0.93, "learning_rate": 2.3981852373393677e-07, "loss": 1.1842, "step": 34136 }, { "epoch": 0.93, "learning_rate": 2.396260142751228e-07, "loss": 1.2319, "step": 34137 }, { "epoch": 0.93, "learning_rate": 2.3943358117688445e-07, "loss": 1.2356, "step": 34138 }, { "epoch": 0.93, "learning_rate": 2.392412244407294e-07, "loss": 1.2629, "step": 34139 }, { "epoch": 0.93, "learning_rate": 2.390489440681587e-07, "loss": 1.4236, "step": 34140 }, { "epoch": 0.93, "learning_rate": 2.3885674006068116e-07, "loss": 1.3738, "step": 34141 }, { "epoch": 0.93, "learning_rate": 2.386646124197989e-07, "loss": 1.2036, "step": 34142 }, { "epoch": 0.93, "learning_rate": 2.38472561147014e-07, "loss": 1.3181, "step": 34143 }, { "epoch": 0.93, "learning_rate": 2.3828058624382756e-07, "loss": 1.3323, "step": 34144 }, { "epoch": 0.93, "learning_rate": 2.380886877117461e-07, "loss": 1.1453, "step": 34145 }, { "epoch": 0.93, "learning_rate": 2.3789686555226732e-07, "loss": 1.709, "step": 34146 }, { "epoch": 0.93, "learning_rate": 2.3770511976689337e-07, "loss": 1.2224, "step": 34147 }, { "epoch": 0.93, "learning_rate": 2.3751345035712413e-07, "loss": 1.3516, "step": 34148 }, { "epoch": 0.93, "learning_rate": 2.3732185732445846e-07, "loss": 1.0153, "step": 34149 }, { "epoch": 0.93, "learning_rate": 2.3713034067039619e-07, "loss": 1.3235, "step": 34150 }, { "epoch": 0.93, "learning_rate": 2.3693890039643507e-07, "loss": 1.252, "step": 34151 }, { "epoch": 0.93, "learning_rate": 2.3674753650407278e-07, "loss": 1.2903, "step": 34152 }, { "epoch": 0.93, "learning_rate": 2.36556248994807e-07, "loss": 1.2236, "step": 34153 }, { "epoch": 0.93, "learning_rate": 2.3636503787013541e-07, "loss": 1.2732, "step": 34154 }, { "epoch": 0.93, "learning_rate": 2.361739031315502e-07, "loss": 1.1917, "step": 34155 }, { "epoch": 0.93, "learning_rate": 2.3598284478055123e-07, "loss": 1.1787, "step": 34156 }, { "epoch": 0.93, "learning_rate": 2.3579186281862952e-07, "loss": 1.2588, "step": 34157 }, { "epoch": 0.93, "learning_rate": 2.3560095724728282e-07, "loss": 1.2632, "step": 34158 }, { "epoch": 0.93, "learning_rate": 2.354101280679999e-07, "loss": 1.3528, "step": 34159 }, { "epoch": 0.93, "learning_rate": 2.3521937528227846e-07, "loss": 1.2554, "step": 34160 }, { "epoch": 0.93, "learning_rate": 2.350286988916084e-07, "loss": 0.979, "step": 34161 }, { "epoch": 0.93, "learning_rate": 2.3483809889748298e-07, "loss": 1.2122, "step": 34162 }, { "epoch": 0.93, "learning_rate": 2.3464757530138993e-07, "loss": 1.2625, "step": 34163 }, { "epoch": 0.93, "learning_rate": 2.3445712810482468e-07, "loss": 1.2463, "step": 34164 }, { "epoch": 0.93, "learning_rate": 2.3426675730927273e-07, "loss": 1.2852, "step": 34165 }, { "epoch": 0.93, "learning_rate": 2.3407646291622844e-07, "loss": 1.2271, "step": 34166 }, { "epoch": 0.93, "learning_rate": 2.3388624492717504e-07, "loss": 1.3306, "step": 34167 }, { "epoch": 0.93, "learning_rate": 2.336961033436036e-07, "loss": 1.2388, "step": 34168 }, { "epoch": 0.93, "learning_rate": 2.335060381670018e-07, "loss": 1.1897, "step": 34169 }, { "epoch": 0.93, "learning_rate": 2.333160493988562e-07, "loss": 1.1096, "step": 34170 }, { "epoch": 0.93, "learning_rate": 2.3312613704065347e-07, "loss": 1.27, "step": 34171 }, { "epoch": 0.93, "learning_rate": 2.3293630109387899e-07, "loss": 1.1768, "step": 34172 }, { "epoch": 0.93, "learning_rate": 2.327465415600183e-07, "loss": 1.3179, "step": 34173 }, { "epoch": 0.93, "learning_rate": 2.3255685844055576e-07, "loss": 1.2119, "step": 34174 }, { "epoch": 0.93, "learning_rate": 2.323672517369746e-07, "loss": 1.1755, "step": 34175 }, { "epoch": 0.93, "learning_rate": 2.3217772145075922e-07, "loss": 1.2251, "step": 34176 }, { "epoch": 0.93, "learning_rate": 2.3198826758339287e-07, "loss": 1.304, "step": 34177 }, { "epoch": 0.93, "learning_rate": 2.3179889013635771e-07, "loss": 1.3186, "step": 34178 }, { "epoch": 0.93, "learning_rate": 2.3160958911113362e-07, "loss": 1.3003, "step": 34179 }, { "epoch": 0.93, "learning_rate": 2.3142036450920168e-07, "loss": 1.3667, "step": 34180 }, { "epoch": 0.93, "learning_rate": 2.3123121633204515e-07, "loss": 1.4316, "step": 34181 }, { "epoch": 0.93, "learning_rate": 2.310421445811417e-07, "loss": 1.2163, "step": 34182 }, { "epoch": 0.93, "learning_rate": 2.308531492579691e-07, "loss": 1.2395, "step": 34183 }, { "epoch": 0.93, "learning_rate": 2.306642303640094e-07, "loss": 1.2869, "step": 34184 }, { "epoch": 0.93, "learning_rate": 2.3047538790073931e-07, "loss": 1.3406, "step": 34185 }, { "epoch": 0.93, "learning_rate": 2.3028662186963536e-07, "loss": 1.4426, "step": 34186 }, { "epoch": 0.93, "learning_rate": 2.3009793227217304e-07, "loss": 1.2197, "step": 34187 }, { "epoch": 0.93, "learning_rate": 2.2990931910983226e-07, "loss": 1.2642, "step": 34188 }, { "epoch": 0.93, "learning_rate": 2.2972078238408635e-07, "loss": 1.2996, "step": 34189 }, { "epoch": 0.93, "learning_rate": 2.2953232209641185e-07, "loss": 1.2676, "step": 34190 }, { "epoch": 0.93, "learning_rate": 2.2934393824827984e-07, "loss": 1.2434, "step": 34191 }, { "epoch": 0.93, "learning_rate": 2.2915563084116798e-07, "loss": 1.3198, "step": 34192 }, { "epoch": 0.93, "learning_rate": 2.2896739987654737e-07, "loss": 1.2451, "step": 34193 }, { "epoch": 0.93, "learning_rate": 2.2877924535589124e-07, "loss": 1.1042, "step": 34194 }, { "epoch": 0.93, "learning_rate": 2.2859116728067065e-07, "loss": 1.2109, "step": 34195 }, { "epoch": 0.93, "learning_rate": 2.2840316565235886e-07, "loss": 1.1614, "step": 34196 }, { "epoch": 0.93, "learning_rate": 2.2821524047242583e-07, "loss": 1.1987, "step": 34197 }, { "epoch": 0.93, "learning_rate": 2.2802739174234145e-07, "loss": 1.2859, "step": 34198 }, { "epoch": 0.93, "learning_rate": 2.2783961946357568e-07, "loss": 1.2683, "step": 34199 }, { "epoch": 0.93, "learning_rate": 2.2765192363759737e-07, "loss": 1.291, "step": 34200 }, { "epoch": 0.93, "learning_rate": 2.274643042658764e-07, "loss": 1.3882, "step": 34201 }, { "epoch": 0.93, "learning_rate": 2.272767613498772e-07, "loss": 1.6553, "step": 34202 }, { "epoch": 0.93, "learning_rate": 2.2708929489107078e-07, "loss": 1.3093, "step": 34203 }, { "epoch": 0.93, "learning_rate": 2.2690190489092045e-07, "loss": 1.2349, "step": 34204 }, { "epoch": 0.93, "learning_rate": 2.2671459135089724e-07, "loss": 1.3088, "step": 34205 }, { "epoch": 0.93, "learning_rate": 2.2652735427245997e-07, "loss": 1.2878, "step": 34206 }, { "epoch": 0.93, "learning_rate": 2.263401936570786e-07, "loss": 1.2166, "step": 34207 }, { "epoch": 0.93, "learning_rate": 2.2615310950621415e-07, "loss": 1.4072, "step": 34208 }, { "epoch": 0.93, "learning_rate": 2.2596610182133328e-07, "loss": 1.1018, "step": 34209 }, { "epoch": 0.93, "learning_rate": 2.257791706038981e-07, "loss": 1.2727, "step": 34210 }, { "epoch": 0.93, "learning_rate": 2.2559231585536966e-07, "loss": 1.2146, "step": 34211 }, { "epoch": 0.93, "learning_rate": 2.2540553757721017e-07, "loss": 1.3574, "step": 34212 }, { "epoch": 0.93, "learning_rate": 2.2521883577088178e-07, "loss": 1.3208, "step": 34213 }, { "epoch": 0.93, "learning_rate": 2.250322104378455e-07, "loss": 1.3357, "step": 34214 }, { "epoch": 0.93, "learning_rate": 2.2484566157955912e-07, "loss": 1.2639, "step": 34215 }, { "epoch": 0.93, "learning_rate": 2.2465918919748475e-07, "loss": 1.3083, "step": 34216 }, { "epoch": 0.93, "learning_rate": 2.2447279329308014e-07, "loss": 1.3372, "step": 34217 }, { "epoch": 0.93, "learning_rate": 2.2428647386780412e-07, "loss": 1.4263, "step": 34218 }, { "epoch": 0.93, "learning_rate": 2.2410023092311216e-07, "loss": 1.1624, "step": 34219 }, { "epoch": 0.93, "learning_rate": 2.2391406446046426e-07, "loss": 1.3071, "step": 34220 }, { "epoch": 0.93, "learning_rate": 2.237279744813159e-07, "loss": 1.7393, "step": 34221 }, { "epoch": 0.93, "learning_rate": 2.2354196098712366e-07, "loss": 1.2974, "step": 34222 }, { "epoch": 0.93, "learning_rate": 2.2335602397933974e-07, "loss": 1.2412, "step": 34223 }, { "epoch": 0.93, "learning_rate": 2.231701634594219e-07, "loss": 1.1309, "step": 34224 }, { "epoch": 0.93, "learning_rate": 2.2298437942882335e-07, "loss": 1.2119, "step": 34225 }, { "epoch": 0.93, "learning_rate": 2.227986718889985e-07, "loss": 1.2371, "step": 34226 }, { "epoch": 0.93, "learning_rate": 2.2261304084139734e-07, "loss": 1.3264, "step": 34227 }, { "epoch": 0.93, "learning_rate": 2.2242748628747536e-07, "loss": 1.3469, "step": 34228 }, { "epoch": 0.93, "learning_rate": 2.2224200822868247e-07, "loss": 1.3047, "step": 34229 }, { "epoch": 0.93, "learning_rate": 2.2205660666646978e-07, "loss": 1.1008, "step": 34230 }, { "epoch": 0.93, "learning_rate": 2.2187128160228942e-07, "loss": 1.2771, "step": 34231 }, { "epoch": 0.93, "learning_rate": 2.216860330375903e-07, "loss": 1.2808, "step": 34232 }, { "epoch": 0.93, "learning_rate": 2.2150086097382117e-07, "loss": 1.094, "step": 34233 }, { "epoch": 0.93, "learning_rate": 2.2131576541243095e-07, "loss": 1.3496, "step": 34234 }, { "epoch": 0.93, "learning_rate": 2.2113074635486731e-07, "loss": 1.1777, "step": 34235 }, { "epoch": 0.93, "learning_rate": 2.2094580380257912e-07, "loss": 1.3325, "step": 34236 }, { "epoch": 0.93, "learning_rate": 2.2076093775701302e-07, "loss": 1.3386, "step": 34237 }, { "epoch": 0.94, "learning_rate": 2.2057614821961337e-07, "loss": 1.1855, "step": 34238 }, { "epoch": 0.94, "learning_rate": 2.2039143519182903e-07, "loss": 1.3933, "step": 34239 }, { "epoch": 0.94, "learning_rate": 2.202067986751022e-07, "loss": 1.1458, "step": 34240 }, { "epoch": 0.94, "learning_rate": 2.2002223867087948e-07, "loss": 1.3076, "step": 34241 }, { "epoch": 0.94, "learning_rate": 2.19837755180603e-07, "loss": 1.282, "step": 34242 }, { "epoch": 0.94, "learning_rate": 2.1965334820571726e-07, "loss": 1.2729, "step": 34243 }, { "epoch": 0.94, "learning_rate": 2.194690177476644e-07, "loss": 1.1627, "step": 34244 }, { "epoch": 0.94, "learning_rate": 2.1928476380788765e-07, "loss": 1.2959, "step": 34245 }, { "epoch": 0.94, "learning_rate": 2.1910058638782706e-07, "loss": 1.2119, "step": 34246 }, { "epoch": 0.94, "learning_rate": 2.1891648548892363e-07, "loss": 1.405, "step": 34247 }, { "epoch": 0.94, "learning_rate": 2.1873246111261958e-07, "loss": 1.3369, "step": 34248 }, { "epoch": 0.94, "learning_rate": 2.1854851326035264e-07, "loss": 1.2478, "step": 34249 }, { "epoch": 0.94, "learning_rate": 2.1836464193356277e-07, "loss": 1.3164, "step": 34250 }, { "epoch": 0.94, "learning_rate": 2.181808471336877e-07, "loss": 1.324, "step": 34251 }, { "epoch": 0.94, "learning_rate": 2.1799712886216628e-07, "loss": 1.2002, "step": 34252 }, { "epoch": 0.94, "learning_rate": 2.1781348712043627e-07, "loss": 1.2361, "step": 34253 }, { "epoch": 0.94, "learning_rate": 2.1762992190993314e-07, "loss": 1.2854, "step": 34254 }, { "epoch": 0.94, "learning_rate": 2.1744643323209246e-07, "loss": 1.3835, "step": 34255 }, { "epoch": 0.94, "learning_rate": 2.1726302108835194e-07, "loss": 1.2261, "step": 34256 }, { "epoch": 0.94, "learning_rate": 2.1707968548014492e-07, "loss": 1.1404, "step": 34257 }, { "epoch": 0.94, "learning_rate": 2.1689642640890684e-07, "loss": 1.3518, "step": 34258 }, { "epoch": 0.94, "learning_rate": 2.1671324387606884e-07, "loss": 1.1509, "step": 34259 }, { "epoch": 0.94, "learning_rate": 2.1653013788306866e-07, "loss": 1.1982, "step": 34260 }, { "epoch": 0.94, "learning_rate": 2.163471084313351e-07, "loss": 1.261, "step": 34261 }, { "epoch": 0.94, "learning_rate": 2.161641555223004e-07, "loss": 1.3328, "step": 34262 }, { "epoch": 0.94, "learning_rate": 2.1598127915739676e-07, "loss": 1.2412, "step": 34263 }, { "epoch": 0.94, "learning_rate": 2.157984793380563e-07, "loss": 1.2397, "step": 34264 }, { "epoch": 0.94, "learning_rate": 2.1561575606570684e-07, "loss": 1.3613, "step": 34265 }, { "epoch": 0.94, "learning_rate": 2.154331093417772e-07, "loss": 1.3748, "step": 34266 }, { "epoch": 0.94, "learning_rate": 2.1525053916769955e-07, "loss": 1.2981, "step": 34267 }, { "epoch": 0.94, "learning_rate": 2.1506804554490168e-07, "loss": 1.1033, "step": 34268 }, { "epoch": 0.94, "learning_rate": 2.148856284748091e-07, "loss": 1.2646, "step": 34269 }, { "epoch": 0.94, "learning_rate": 2.1470328795884844e-07, "loss": 1.1299, "step": 34270 }, { "epoch": 0.94, "learning_rate": 2.1452102399844964e-07, "loss": 1.2515, "step": 34271 }, { "epoch": 0.94, "learning_rate": 2.143388365950372e-07, "loss": 1.1582, "step": 34272 }, { "epoch": 0.94, "learning_rate": 2.1415672575003543e-07, "loss": 1.2434, "step": 34273 }, { "epoch": 0.94, "learning_rate": 2.1397469146486883e-07, "loss": 1.2712, "step": 34274 }, { "epoch": 0.94, "learning_rate": 2.1379273374096399e-07, "loss": 1.396, "step": 34275 }, { "epoch": 0.94, "learning_rate": 2.136108525797431e-07, "loss": 1.3057, "step": 34276 }, { "epoch": 0.94, "learning_rate": 2.1342904798262843e-07, "loss": 1.2578, "step": 34277 }, { "epoch": 0.94, "learning_rate": 2.132473199510432e-07, "loss": 1.1624, "step": 34278 }, { "epoch": 0.94, "learning_rate": 2.1306566848640742e-07, "loss": 1.2937, "step": 34279 }, { "epoch": 0.94, "learning_rate": 2.128840935901466e-07, "loss": 1.1743, "step": 34280 }, { "epoch": 0.94, "learning_rate": 2.127025952636763e-07, "loss": 1.2122, "step": 34281 }, { "epoch": 0.94, "learning_rate": 2.125211735084187e-07, "loss": 1.2644, "step": 34282 }, { "epoch": 0.94, "learning_rate": 2.1233982832579269e-07, "loss": 1.2415, "step": 34283 }, { "epoch": 0.94, "learning_rate": 2.1215855971721933e-07, "loss": 1.2837, "step": 34284 }, { "epoch": 0.94, "learning_rate": 2.1197736768411304e-07, "loss": 1.0938, "step": 34285 }, { "epoch": 0.94, "learning_rate": 2.117962522278938e-07, "loss": 1.395, "step": 34286 }, { "epoch": 0.94, "learning_rate": 2.1161521334997825e-07, "loss": 1.2915, "step": 34287 }, { "epoch": 0.94, "learning_rate": 2.1143425105178306e-07, "loss": 1.2109, "step": 34288 }, { "epoch": 0.94, "learning_rate": 2.1125336533472153e-07, "loss": 1.3132, "step": 34289 }, { "epoch": 0.94, "learning_rate": 2.1107255620021138e-07, "loss": 1.29, "step": 34290 }, { "epoch": 0.94, "learning_rate": 2.1089182364966599e-07, "loss": 1.2366, "step": 34291 }, { "epoch": 0.94, "learning_rate": 2.1071116768450083e-07, "loss": 1.1177, "step": 34292 }, { "epoch": 0.94, "learning_rate": 2.1053058830612817e-07, "loss": 1.2554, "step": 34293 }, { "epoch": 0.94, "learning_rate": 2.1035008551596013e-07, "loss": 1.1709, "step": 34294 }, { "epoch": 0.94, "learning_rate": 2.1016965931541012e-07, "loss": 1.2838, "step": 34295 }, { "epoch": 0.94, "learning_rate": 2.0998930970588915e-07, "loss": 1.1824, "step": 34296 }, { "epoch": 0.94, "learning_rate": 2.0980903668880946e-07, "loss": 1.3628, "step": 34297 }, { "epoch": 0.94, "learning_rate": 2.0962884026557774e-07, "loss": 1.1228, "step": 34298 }, { "epoch": 0.94, "learning_rate": 2.094487204376072e-07, "loss": 1.3096, "step": 34299 }, { "epoch": 0.94, "learning_rate": 2.0926867720630682e-07, "loss": 1.3181, "step": 34300 }, { "epoch": 0.94, "learning_rate": 2.0908871057308434e-07, "loss": 1.2839, "step": 34301 }, { "epoch": 0.94, "learning_rate": 2.0890882053934637e-07, "loss": 1.312, "step": 34302 }, { "epoch": 0.94, "learning_rate": 2.087290071065029e-07, "loss": 1.3625, "step": 34303 }, { "epoch": 0.94, "learning_rate": 2.085492702759595e-07, "loss": 1.3428, "step": 34304 }, { "epoch": 0.94, "learning_rate": 2.0836961004912282e-07, "loss": 1.2534, "step": 34305 }, { "epoch": 0.94, "learning_rate": 2.0819002642739615e-07, "loss": 1.3364, "step": 34306 }, { "epoch": 0.94, "learning_rate": 2.080105194121873e-07, "loss": 1.3726, "step": 34307 }, { "epoch": 0.94, "learning_rate": 2.0783108900489956e-07, "loss": 1.3071, "step": 34308 }, { "epoch": 0.94, "learning_rate": 2.0765173520693627e-07, "loss": 1.1482, "step": 34309 }, { "epoch": 0.94, "learning_rate": 2.0747245801970184e-07, "loss": 1.2207, "step": 34310 }, { "epoch": 0.94, "learning_rate": 2.072932574445985e-07, "loss": 1.1262, "step": 34311 }, { "epoch": 0.94, "learning_rate": 2.0711413348302733e-07, "loss": 1.1601, "step": 34312 }, { "epoch": 0.94, "learning_rate": 2.0693508613639058e-07, "loss": 1.3535, "step": 34313 }, { "epoch": 0.94, "learning_rate": 2.067561154060882e-07, "loss": 1.2556, "step": 34314 }, { "epoch": 0.94, "learning_rate": 2.065772212935213e-07, "loss": 1.4087, "step": 34315 }, { "epoch": 0.94, "learning_rate": 2.063984038000888e-07, "loss": 1.0552, "step": 34316 }, { "epoch": 0.94, "learning_rate": 2.0621966292718952e-07, "loss": 1.2445, "step": 34317 }, { "epoch": 0.94, "learning_rate": 2.060409986762224e-07, "loss": 1.1055, "step": 34318 }, { "epoch": 0.94, "learning_rate": 2.058624110485863e-07, "loss": 1.3125, "step": 34319 }, { "epoch": 0.94, "learning_rate": 2.0568390004567563e-07, "loss": 1.3209, "step": 34320 }, { "epoch": 0.94, "learning_rate": 2.0550546566888819e-07, "loss": 1.2278, "step": 34321 }, { "epoch": 0.94, "learning_rate": 2.0532710791962064e-07, "loss": 1.1777, "step": 34322 }, { "epoch": 0.94, "learning_rate": 2.0514882679926962e-07, "loss": 1.2952, "step": 34323 }, { "epoch": 0.94, "learning_rate": 2.0497062230922626e-07, "loss": 1.3804, "step": 34324 }, { "epoch": 0.94, "learning_rate": 2.0479249445088833e-07, "loss": 1.3235, "step": 34325 }, { "epoch": 0.94, "learning_rate": 2.0461444322564693e-07, "loss": 1.075, "step": 34326 }, { "epoch": 0.94, "learning_rate": 2.0443646863489764e-07, "loss": 1.1636, "step": 34327 }, { "epoch": 0.94, "learning_rate": 2.042585706800293e-07, "loss": 1.1731, "step": 34328 }, { "epoch": 0.94, "learning_rate": 2.0408074936243637e-07, "loss": 1.3579, "step": 34329 }, { "epoch": 0.94, "learning_rate": 2.0390300468350888e-07, "loss": 1.7729, "step": 34330 }, { "epoch": 0.94, "learning_rate": 2.03725336644639e-07, "loss": 1.709, "step": 34331 }, { "epoch": 0.94, "learning_rate": 2.0354774524721455e-07, "loss": 1.2434, "step": 34332 }, { "epoch": 0.94, "learning_rate": 2.033702304926255e-07, "loss": 1.283, "step": 34333 }, { "epoch": 0.94, "learning_rate": 2.0319279238226186e-07, "loss": 1.2275, "step": 34334 }, { "epoch": 0.94, "learning_rate": 2.030154309175114e-07, "loss": 1.2566, "step": 34335 }, { "epoch": 0.94, "learning_rate": 2.028381460997597e-07, "loss": 1.2161, "step": 34336 }, { "epoch": 0.94, "learning_rate": 2.0266093793039677e-07, "loss": 1.2476, "step": 34337 }, { "epoch": 0.94, "learning_rate": 2.02483806410807e-07, "loss": 1.3411, "step": 34338 }, { "epoch": 0.94, "learning_rate": 2.0230675154237712e-07, "loss": 1.2363, "step": 34339 }, { "epoch": 0.94, "learning_rate": 2.0212977332649263e-07, "loss": 1.3462, "step": 34340 }, { "epoch": 0.94, "learning_rate": 2.0195287176453582e-07, "loss": 1.1841, "step": 34341 }, { "epoch": 0.94, "learning_rate": 2.0177604685789443e-07, "loss": 1.2732, "step": 34342 }, { "epoch": 0.94, "learning_rate": 2.0159929860794847e-07, "loss": 1.3916, "step": 34343 }, { "epoch": 0.94, "learning_rate": 2.014226270160835e-07, "loss": 1.3247, "step": 34344 }, { "epoch": 0.94, "learning_rate": 2.0124603208367842e-07, "loss": 1.3523, "step": 34345 }, { "epoch": 0.94, "learning_rate": 2.0106951381211771e-07, "loss": 1.4111, "step": 34346 }, { "epoch": 0.94, "learning_rate": 2.0089307220278132e-07, "loss": 1.2783, "step": 34347 }, { "epoch": 0.94, "learning_rate": 2.0071670725704928e-07, "loss": 1.3584, "step": 34348 }, { "epoch": 0.94, "learning_rate": 2.005404189763016e-07, "loss": 1.2244, "step": 34349 }, { "epoch": 0.94, "learning_rate": 2.003642073619183e-07, "loss": 1.3489, "step": 34350 }, { "epoch": 0.94, "learning_rate": 2.0018807241527716e-07, "loss": 1.4412, "step": 34351 }, { "epoch": 0.94, "learning_rate": 2.0001201413775596e-07, "loss": 1.2783, "step": 34352 }, { "epoch": 0.94, "learning_rate": 1.9983603253073248e-07, "loss": 1.261, "step": 34353 }, { "epoch": 0.94, "learning_rate": 1.996601275955845e-07, "loss": 1.3655, "step": 34354 }, { "epoch": 0.94, "learning_rate": 1.9948429933368653e-07, "loss": 1.3206, "step": 34355 }, { "epoch": 0.94, "learning_rate": 1.9930854774641406e-07, "loss": 1.2881, "step": 34356 }, { "epoch": 0.94, "learning_rate": 1.991328728351438e-07, "loss": 1.2686, "step": 34357 }, { "epoch": 0.94, "learning_rate": 1.9895727460124915e-07, "loss": 1.3164, "step": 34358 }, { "epoch": 0.94, "learning_rate": 1.9878175304610447e-07, "loss": 1.2983, "step": 34359 }, { "epoch": 0.94, "learning_rate": 1.9860630817108205e-07, "loss": 1.1443, "step": 34360 }, { "epoch": 0.94, "learning_rate": 1.9843093997755525e-07, "loss": 1.0876, "step": 34361 }, { "epoch": 0.94, "learning_rate": 1.9825564846689517e-07, "loss": 1.2378, "step": 34362 }, { "epoch": 0.94, "learning_rate": 1.9808043364047403e-07, "loss": 0.9814, "step": 34363 }, { "epoch": 0.94, "learning_rate": 1.9790529549966186e-07, "loss": 1.2939, "step": 34364 }, { "epoch": 0.94, "learning_rate": 1.9773023404583093e-07, "loss": 1.3188, "step": 34365 }, { "epoch": 0.94, "learning_rate": 1.9755524928034787e-07, "loss": 1.2283, "step": 34366 }, { "epoch": 0.94, "learning_rate": 1.9738034120458382e-07, "loss": 1.2371, "step": 34367 }, { "epoch": 0.94, "learning_rate": 1.972055098199055e-07, "loss": 1.2612, "step": 34368 }, { "epoch": 0.94, "learning_rate": 1.9703075512768177e-07, "loss": 1.2292, "step": 34369 }, { "epoch": 0.94, "learning_rate": 1.9685607712928157e-07, "loss": 1.3584, "step": 34370 }, { "epoch": 0.94, "learning_rate": 1.9668147582606824e-07, "loss": 1.2465, "step": 34371 }, { "epoch": 0.94, "learning_rate": 1.9650695121940955e-07, "loss": 1.2478, "step": 34372 }, { "epoch": 0.94, "learning_rate": 1.9633250331067e-07, "loss": 1.2117, "step": 34373 }, { "epoch": 0.94, "learning_rate": 1.9615813210121626e-07, "loss": 1.1924, "step": 34374 }, { "epoch": 0.94, "learning_rate": 1.9598383759240948e-07, "loss": 1.2249, "step": 34375 }, { "epoch": 0.94, "learning_rate": 1.958096197856163e-07, "loss": 1.3091, "step": 34376 }, { "epoch": 0.94, "learning_rate": 1.956354786821968e-07, "loss": 1.3391, "step": 34377 }, { "epoch": 0.94, "learning_rate": 1.9546141428351762e-07, "loss": 1.1895, "step": 34378 }, { "epoch": 0.94, "learning_rate": 1.9528742659093548e-07, "loss": 1.3257, "step": 34379 }, { "epoch": 0.94, "learning_rate": 1.9511351560581482e-07, "loss": 1.2219, "step": 34380 }, { "epoch": 0.94, "learning_rate": 1.9493968132951456e-07, "loss": 1.2224, "step": 34381 }, { "epoch": 0.94, "learning_rate": 1.947659237633981e-07, "loss": 1.0627, "step": 34382 }, { "epoch": 0.94, "learning_rate": 1.9459224290881985e-07, "loss": 1.3042, "step": 34383 }, { "epoch": 0.94, "learning_rate": 1.9441863876714096e-07, "loss": 1.334, "step": 34384 }, { "epoch": 0.94, "learning_rate": 1.9424511133972147e-07, "loss": 1.2427, "step": 34385 }, { "epoch": 0.94, "learning_rate": 1.9407166062791694e-07, "loss": 1.1921, "step": 34386 }, { "epoch": 0.94, "learning_rate": 1.9389828663308408e-07, "loss": 1.071, "step": 34387 }, { "epoch": 0.94, "learning_rate": 1.9372498935657957e-07, "loss": 1.2358, "step": 34388 }, { "epoch": 0.94, "learning_rate": 1.935517687997601e-07, "loss": 1.3452, "step": 34389 }, { "epoch": 0.94, "learning_rate": 1.9337862496398018e-07, "loss": 1.356, "step": 34390 }, { "epoch": 0.94, "learning_rate": 1.9320555785059424e-07, "loss": 1.2446, "step": 34391 }, { "epoch": 0.94, "learning_rate": 1.9303256746095678e-07, "loss": 1.3584, "step": 34392 }, { "epoch": 0.94, "learning_rate": 1.9285965379642112e-07, "loss": 1.2971, "step": 34393 }, { "epoch": 0.94, "learning_rate": 1.9268681685833957e-07, "loss": 1.7646, "step": 34394 }, { "epoch": 0.94, "learning_rate": 1.9251405664806543e-07, "loss": 1.3335, "step": 34395 }, { "epoch": 0.94, "learning_rate": 1.9234137316694767e-07, "loss": 1.2559, "step": 34396 }, { "epoch": 0.94, "learning_rate": 1.9216876641634076e-07, "loss": 1.1509, "step": 34397 }, { "epoch": 0.94, "learning_rate": 1.9199623639759245e-07, "loss": 1.2312, "step": 34398 }, { "epoch": 0.94, "learning_rate": 1.9182378311205507e-07, "loss": 1.4038, "step": 34399 }, { "epoch": 0.94, "learning_rate": 1.9165140656107416e-07, "loss": 1.2086, "step": 34400 }, { "epoch": 0.94, "learning_rate": 1.91479106746002e-07, "loss": 1.1907, "step": 34401 }, { "epoch": 0.94, "learning_rate": 1.9130688366818417e-07, "loss": 1.2527, "step": 34402 }, { "epoch": 0.94, "learning_rate": 1.911347373289696e-07, "loss": 1.2805, "step": 34403 }, { "epoch": 0.94, "learning_rate": 1.9096266772970385e-07, "loss": 1.6655, "step": 34404 }, { "epoch": 0.94, "learning_rate": 1.9079067487173363e-07, "loss": 1.1228, "step": 34405 }, { "epoch": 0.94, "learning_rate": 1.9061875875640568e-07, "loss": 1.1929, "step": 34406 }, { "epoch": 0.94, "learning_rate": 1.9044691938506222e-07, "loss": 1.4124, "step": 34407 }, { "epoch": 0.94, "learning_rate": 1.9027515675904995e-07, "loss": 1.2671, "step": 34408 }, { "epoch": 0.94, "learning_rate": 1.9010347087971225e-07, "loss": 1.2949, "step": 34409 }, { "epoch": 0.94, "learning_rate": 1.899318617483925e-07, "loss": 1.2825, "step": 34410 }, { "epoch": 0.94, "learning_rate": 1.8976032936643185e-07, "loss": 1.2261, "step": 34411 }, { "epoch": 0.94, "learning_rate": 1.8958887373517365e-07, "loss": 1.3125, "step": 34412 }, { "epoch": 0.94, "learning_rate": 1.8941749485595906e-07, "loss": 1.2083, "step": 34413 }, { "epoch": 0.94, "learning_rate": 1.8924619273012923e-07, "loss": 1.1702, "step": 34414 }, { "epoch": 0.94, "learning_rate": 1.8907496735902199e-07, "loss": 1.2488, "step": 34415 }, { "epoch": 0.94, "learning_rate": 1.8890381874397957e-07, "loss": 1.2883, "step": 34416 }, { "epoch": 0.94, "learning_rate": 1.8873274688634203e-07, "loss": 1.1873, "step": 34417 }, { "epoch": 0.94, "learning_rate": 1.8856175178744385e-07, "loss": 1.1274, "step": 34418 }, { "epoch": 0.94, "learning_rate": 1.883908334486262e-07, "loss": 1.3386, "step": 34419 }, { "epoch": 0.94, "learning_rate": 1.8821999187122354e-07, "loss": 1.46, "step": 34420 }, { "epoch": 0.94, "learning_rate": 1.880492270565748e-07, "loss": 1.2664, "step": 34421 }, { "epoch": 0.94, "learning_rate": 1.878785390060145e-07, "loss": 1.7949, "step": 34422 }, { "epoch": 0.94, "learning_rate": 1.877079277208793e-07, "loss": 1.2634, "step": 34423 }, { "epoch": 0.94, "learning_rate": 1.8753739320250153e-07, "loss": 1.3125, "step": 34424 }, { "epoch": 0.94, "learning_rate": 1.8736693545222008e-07, "loss": 1.2773, "step": 34425 }, { "epoch": 0.94, "learning_rate": 1.8719655447136275e-07, "loss": 1.1355, "step": 34426 }, { "epoch": 0.94, "learning_rate": 1.870262502612663e-07, "loss": 1.1426, "step": 34427 }, { "epoch": 0.94, "learning_rate": 1.8685602282326077e-07, "loss": 1.3394, "step": 34428 }, { "epoch": 0.94, "learning_rate": 1.8668587215868172e-07, "loss": 1.3398, "step": 34429 }, { "epoch": 0.94, "learning_rate": 1.8651579826885592e-07, "loss": 1.3213, "step": 34430 }, { "epoch": 0.94, "learning_rate": 1.8634580115511668e-07, "loss": 1.2712, "step": 34431 }, { "epoch": 0.94, "learning_rate": 1.86175880818793e-07, "loss": 1.2437, "step": 34432 }, { "epoch": 0.94, "learning_rate": 1.860060372612149e-07, "loss": 1.2266, "step": 34433 }, { "epoch": 0.94, "learning_rate": 1.8583627048371023e-07, "loss": 1.3152, "step": 34434 }, { "epoch": 0.94, "learning_rate": 1.8566658048760677e-07, "loss": 1.1714, "step": 34435 }, { "epoch": 0.94, "learning_rate": 1.8549696727423462e-07, "loss": 1.2297, "step": 34436 }, { "epoch": 0.94, "learning_rate": 1.8532743084491822e-07, "loss": 1.3103, "step": 34437 }, { "epoch": 0.94, "learning_rate": 1.8515797120098543e-07, "loss": 1.2708, "step": 34438 }, { "epoch": 0.94, "learning_rate": 1.8498858834375964e-07, "loss": 1.311, "step": 34439 }, { "epoch": 0.94, "learning_rate": 1.848192822745698e-07, "loss": 1.3096, "step": 34440 }, { "epoch": 0.94, "learning_rate": 1.8465005299473816e-07, "loss": 1.0657, "step": 34441 }, { "epoch": 0.94, "learning_rate": 1.844809005055881e-07, "loss": 1.2959, "step": 34442 }, { "epoch": 0.94, "learning_rate": 1.8431182480844412e-07, "loss": 1.1392, "step": 34443 }, { "epoch": 0.94, "learning_rate": 1.841428259046296e-07, "loss": 1.2864, "step": 34444 }, { "epoch": 0.94, "learning_rate": 1.8397390379546576e-07, "loss": 1.3394, "step": 34445 }, { "epoch": 0.94, "learning_rate": 1.838050584822726e-07, "loss": 1.2998, "step": 34446 }, { "epoch": 0.94, "learning_rate": 1.836362899663746e-07, "loss": 1.272, "step": 34447 }, { "epoch": 0.94, "learning_rate": 1.8346759824908966e-07, "loss": 1.3315, "step": 34448 }, { "epoch": 0.94, "learning_rate": 1.832989833317389e-07, "loss": 1.2449, "step": 34449 }, { "epoch": 0.94, "learning_rate": 1.8313044521563905e-07, "loss": 1.6729, "step": 34450 }, { "epoch": 0.94, "learning_rate": 1.8296198390211128e-07, "loss": 1.2595, "step": 34451 }, { "epoch": 0.94, "learning_rate": 1.8279359939247342e-07, "loss": 1.3538, "step": 34452 }, { "epoch": 0.94, "learning_rate": 1.826252916880411e-07, "loss": 1.0015, "step": 34453 }, { "epoch": 0.94, "learning_rate": 1.8245706079013214e-07, "loss": 1.1409, "step": 34454 }, { "epoch": 0.94, "learning_rate": 1.8228890670006328e-07, "loss": 1.2202, "step": 34455 }, { "epoch": 0.94, "learning_rate": 1.82120829419149e-07, "loss": 0.9717, "step": 34456 }, { "epoch": 0.94, "learning_rate": 1.819528289487049e-07, "loss": 1.2432, "step": 34457 }, { "epoch": 0.94, "learning_rate": 1.8178490529004333e-07, "loss": 1.2844, "step": 34458 }, { "epoch": 0.94, "learning_rate": 1.8161705844448208e-07, "loss": 1.1311, "step": 34459 }, { "epoch": 0.94, "learning_rate": 1.814492884133312e-07, "loss": 1.3176, "step": 34460 }, { "epoch": 0.94, "learning_rate": 1.8128159519790412e-07, "loss": 1.2593, "step": 34461 }, { "epoch": 0.94, "learning_rate": 1.8111397879951198e-07, "loss": 1.2688, "step": 34462 }, { "epoch": 0.94, "learning_rate": 1.8094643921946707e-07, "loss": 1.1274, "step": 34463 }, { "epoch": 0.94, "learning_rate": 1.8077897645908172e-07, "loss": 1.3091, "step": 34464 }, { "epoch": 0.94, "learning_rate": 1.806115905196626e-07, "loss": 1.2844, "step": 34465 }, { "epoch": 0.94, "learning_rate": 1.80444281402522e-07, "loss": 1.3276, "step": 34466 }, { "epoch": 0.94, "learning_rate": 1.802770491089667e-07, "loss": 1.3413, "step": 34467 }, { "epoch": 0.94, "learning_rate": 1.8010989364030783e-07, "loss": 1.271, "step": 34468 }, { "epoch": 0.94, "learning_rate": 1.7994281499784994e-07, "loss": 1.1909, "step": 34469 }, { "epoch": 0.94, "learning_rate": 1.7977581318290304e-07, "loss": 1.2742, "step": 34470 }, { "epoch": 0.94, "learning_rate": 1.796088881967717e-07, "loss": 1.4041, "step": 34471 }, { "epoch": 0.94, "learning_rate": 1.794420400407626e-07, "loss": 1.312, "step": 34472 }, { "epoch": 0.94, "learning_rate": 1.792752687161814e-07, "loss": 1.2969, "step": 34473 }, { "epoch": 0.94, "learning_rate": 1.7910857422433147e-07, "loss": 1.238, "step": 34474 }, { "epoch": 0.94, "learning_rate": 1.7894195656651847e-07, "loss": 1.2512, "step": 34475 }, { "epoch": 0.94, "learning_rate": 1.7877541574404577e-07, "loss": 1.1978, "step": 34476 }, { "epoch": 0.94, "learning_rate": 1.7860895175821568e-07, "loss": 1.2273, "step": 34477 }, { "epoch": 0.94, "learning_rate": 1.784425646103305e-07, "loss": 1.2134, "step": 34478 }, { "epoch": 0.94, "learning_rate": 1.7827625430169249e-07, "loss": 1.2544, "step": 34479 }, { "epoch": 0.94, "learning_rate": 1.7811002083360286e-07, "loss": 1.0793, "step": 34480 }, { "epoch": 0.94, "learning_rate": 1.7794386420736275e-07, "loss": 1.3016, "step": 34481 }, { "epoch": 0.94, "learning_rate": 1.7777778442426896e-07, "loss": 1.1377, "step": 34482 }, { "epoch": 0.94, "learning_rate": 1.7761178148562486e-07, "loss": 1.2856, "step": 34483 }, { "epoch": 0.94, "learning_rate": 1.7744585539272719e-07, "loss": 1.1758, "step": 34484 }, { "epoch": 0.94, "learning_rate": 1.772800061468738e-07, "loss": 1.1475, "step": 34485 }, { "epoch": 0.94, "learning_rate": 1.7711423374936142e-07, "loss": 1.2305, "step": 34486 }, { "epoch": 0.94, "learning_rate": 1.7694853820149016e-07, "loss": 1.2944, "step": 34487 }, { "epoch": 0.94, "learning_rate": 1.7678291950455339e-07, "loss": 1.7681, "step": 34488 }, { "epoch": 0.94, "learning_rate": 1.7661737765984898e-07, "loss": 1.2656, "step": 34489 }, { "epoch": 0.94, "learning_rate": 1.7645191266866924e-07, "loss": 1.3191, "step": 34490 }, { "epoch": 0.94, "learning_rate": 1.76286524532312e-07, "loss": 1.3477, "step": 34491 }, { "epoch": 0.94, "learning_rate": 1.7612121325206843e-07, "loss": 1.2263, "step": 34492 }, { "epoch": 0.94, "learning_rate": 1.759559788292331e-07, "loss": 1.2717, "step": 34493 }, { "epoch": 0.94, "learning_rate": 1.757908212650994e-07, "loss": 1.2539, "step": 34494 }, { "epoch": 0.94, "learning_rate": 1.756257405609585e-07, "loss": 1.2964, "step": 34495 }, { "epoch": 0.94, "learning_rate": 1.754607367181016e-07, "loss": 1.271, "step": 34496 }, { "epoch": 0.94, "learning_rate": 1.752958097378199e-07, "loss": 1.364, "step": 34497 }, { "epoch": 0.94, "learning_rate": 1.751309596214046e-07, "loss": 1.2795, "step": 34498 }, { "epoch": 0.94, "learning_rate": 1.7496618637014352e-07, "loss": 1.4219, "step": 34499 }, { "epoch": 0.94, "learning_rate": 1.7480148998532786e-07, "loss": 1.281, "step": 34500 }, { "epoch": 0.94, "learning_rate": 1.746368704682444e-07, "loss": 1.2561, "step": 34501 }, { "epoch": 0.94, "learning_rate": 1.744723278201832e-07, "loss": 1.2202, "step": 34502 }, { "epoch": 0.94, "learning_rate": 1.743078620424299e-07, "loss": 1.3313, "step": 34503 }, { "epoch": 0.94, "learning_rate": 1.741434731362712e-07, "loss": 1.2622, "step": 34504 }, { "epoch": 0.94, "learning_rate": 1.7397916110299285e-07, "loss": 1.3372, "step": 34505 }, { "epoch": 0.94, "learning_rate": 1.738149259438815e-07, "loss": 1.1846, "step": 34506 }, { "epoch": 0.94, "learning_rate": 1.736507676602217e-07, "loss": 1.3364, "step": 34507 }, { "epoch": 0.94, "learning_rate": 1.73486686253298e-07, "loss": 1.3071, "step": 34508 }, { "epoch": 0.94, "learning_rate": 1.7332268172439272e-07, "loss": 1.2708, "step": 34509 }, { "epoch": 0.94, "learning_rate": 1.731587540747903e-07, "loss": 1.281, "step": 34510 }, { "epoch": 0.94, "learning_rate": 1.7299490330577316e-07, "loss": 1.3225, "step": 34511 }, { "epoch": 0.94, "learning_rate": 1.7283112941862357e-07, "loss": 1.6494, "step": 34512 }, { "epoch": 0.94, "learning_rate": 1.726674324146216e-07, "loss": 1.2246, "step": 34513 }, { "epoch": 0.94, "learning_rate": 1.725038122950473e-07, "loss": 1.228, "step": 34514 }, { "epoch": 0.94, "learning_rate": 1.7234026906118306e-07, "loss": 1.3079, "step": 34515 }, { "epoch": 0.94, "learning_rate": 1.7217680271430782e-07, "loss": 1.2703, "step": 34516 }, { "epoch": 0.94, "learning_rate": 1.7201341325569943e-07, "loss": 1.1069, "step": 34517 }, { "epoch": 0.94, "learning_rate": 1.7185010068663576e-07, "loss": 1.4309, "step": 34518 }, { "epoch": 0.94, "learning_rate": 1.7168686500839694e-07, "loss": 1.2263, "step": 34519 }, { "epoch": 0.94, "learning_rate": 1.7152370622225744e-07, "loss": 1.2388, "step": 34520 }, { "epoch": 0.94, "learning_rate": 1.713606243294963e-07, "loss": 1.415, "step": 34521 }, { "epoch": 0.94, "learning_rate": 1.711976193313858e-07, "loss": 1.3838, "step": 34522 }, { "epoch": 0.94, "learning_rate": 1.710346912292038e-07, "loss": 1.1621, "step": 34523 }, { "epoch": 0.94, "learning_rate": 1.7087184002422485e-07, "loss": 1.3281, "step": 34524 }, { "epoch": 0.94, "learning_rate": 1.7070906571772238e-07, "loss": 1.2068, "step": 34525 }, { "epoch": 0.94, "learning_rate": 1.7054636831097092e-07, "loss": 1.2349, "step": 34526 }, { "epoch": 0.94, "learning_rate": 1.703837478052417e-07, "loss": 1.2212, "step": 34527 }, { "epoch": 0.94, "learning_rate": 1.702212042018092e-07, "loss": 1.2068, "step": 34528 }, { "epoch": 0.94, "learning_rate": 1.7005873750194135e-07, "loss": 1.311, "step": 34529 }, { "epoch": 0.94, "learning_rate": 1.6989634770691264e-07, "loss": 1.3977, "step": 34530 }, { "epoch": 0.94, "learning_rate": 1.697340348179932e-07, "loss": 1.2415, "step": 34531 }, { "epoch": 0.94, "learning_rate": 1.6957179883645204e-07, "loss": 1.3064, "step": 34532 }, { "epoch": 0.94, "learning_rate": 1.6940963976355806e-07, "loss": 1.4546, "step": 34533 }, { "epoch": 0.94, "learning_rate": 1.692475576005803e-07, "loss": 1.119, "step": 34534 }, { "epoch": 0.94, "learning_rate": 1.6908555234878665e-07, "loss": 1.27, "step": 34535 }, { "epoch": 0.94, "learning_rate": 1.6892362400944606e-07, "loss": 1.4282, "step": 34536 }, { "epoch": 0.94, "learning_rate": 1.687617725838231e-07, "loss": 1.3606, "step": 34537 }, { "epoch": 0.94, "learning_rate": 1.685999980731845e-07, "loss": 1.3655, "step": 34538 }, { "epoch": 0.94, "learning_rate": 1.6843830047879818e-07, "loss": 1.3416, "step": 34539 }, { "epoch": 0.94, "learning_rate": 1.682766798019253e-07, "loss": 1.2852, "step": 34540 }, { "epoch": 0.94, "learning_rate": 1.681151360438349e-07, "loss": 1.0957, "step": 34541 }, { "epoch": 0.94, "learning_rate": 1.6795366920578593e-07, "loss": 1.1028, "step": 34542 }, { "epoch": 0.94, "learning_rate": 1.677922792890463e-07, "loss": 1.3037, "step": 34543 }, { "epoch": 0.94, "learning_rate": 1.6763096629487497e-07, "loss": 1.2551, "step": 34544 }, { "epoch": 0.94, "learning_rate": 1.674697302245365e-07, "loss": 1.1453, "step": 34545 }, { "epoch": 0.94, "learning_rate": 1.673085710792899e-07, "loss": 1.2451, "step": 34546 }, { "epoch": 0.94, "learning_rate": 1.6714748886039966e-07, "loss": 1.3271, "step": 34547 }, { "epoch": 0.94, "learning_rate": 1.669864835691215e-07, "loss": 1.2917, "step": 34548 }, { "epoch": 0.94, "learning_rate": 1.6682555520671883e-07, "loss": 1.437, "step": 34549 }, { "epoch": 0.94, "learning_rate": 1.6666470377444733e-07, "loss": 1.1238, "step": 34550 }, { "epoch": 0.94, "learning_rate": 1.6650392927356928e-07, "loss": 1.3062, "step": 34551 }, { "epoch": 0.94, "learning_rate": 1.6634323170533928e-07, "loss": 1.2659, "step": 34552 }, { "epoch": 0.94, "learning_rate": 1.661826110710163e-07, "loss": 1.2134, "step": 34553 }, { "epoch": 0.94, "learning_rate": 1.6602206737185488e-07, "loss": 1.2363, "step": 34554 }, { "epoch": 0.94, "learning_rate": 1.6586160060911406e-07, "loss": 1.3252, "step": 34555 }, { "epoch": 0.94, "learning_rate": 1.657012107840472e-07, "loss": 1.2744, "step": 34556 }, { "epoch": 0.94, "learning_rate": 1.6554089789791007e-07, "loss": 1.2368, "step": 34557 }, { "epoch": 0.94, "learning_rate": 1.65380661951956e-07, "loss": 1.2969, "step": 34558 }, { "epoch": 0.94, "learning_rate": 1.6522050294743964e-07, "loss": 1.2805, "step": 34559 }, { "epoch": 0.94, "learning_rate": 1.6506042088561325e-07, "loss": 1.2065, "step": 34560 }, { "epoch": 0.94, "learning_rate": 1.6490041576772808e-07, "loss": 1.2734, "step": 34561 }, { "epoch": 0.94, "learning_rate": 1.6474048759503868e-07, "loss": 1.1709, "step": 34562 }, { "epoch": 0.94, "learning_rate": 1.6458063636879517e-07, "loss": 1.085, "step": 34563 }, { "epoch": 0.94, "learning_rate": 1.6442086209024764e-07, "loss": 1.2405, "step": 34564 }, { "epoch": 0.94, "learning_rate": 1.6426116476064512e-07, "loss": 1.322, "step": 34565 }, { "epoch": 0.94, "learning_rate": 1.6410154438123882e-07, "loss": 1.3259, "step": 34566 }, { "epoch": 0.94, "learning_rate": 1.6394200095327772e-07, "loss": 1.2722, "step": 34567 }, { "epoch": 0.94, "learning_rate": 1.6378253447800863e-07, "loss": 1.1863, "step": 34568 }, { "epoch": 0.94, "learning_rate": 1.636231449566783e-07, "loss": 1.177, "step": 34569 }, { "epoch": 0.94, "learning_rate": 1.6346383239053686e-07, "loss": 1.3347, "step": 34570 }, { "epoch": 0.94, "learning_rate": 1.633045967808289e-07, "loss": 1.2781, "step": 34571 }, { "epoch": 0.94, "learning_rate": 1.631454381287989e-07, "loss": 1.3201, "step": 34572 }, { "epoch": 0.94, "learning_rate": 1.629863564356937e-07, "loss": 1.3191, "step": 34573 }, { "epoch": 0.94, "learning_rate": 1.6282735170275897e-07, "loss": 1.0818, "step": 34574 }, { "epoch": 0.94, "learning_rate": 1.6266842393123595e-07, "loss": 1.1748, "step": 34575 }, { "epoch": 0.94, "learning_rate": 1.6250957312236916e-07, "loss": 1.2607, "step": 34576 }, { "epoch": 0.94, "learning_rate": 1.6235079927740205e-07, "loss": 1.1038, "step": 34577 }, { "epoch": 0.94, "learning_rate": 1.62192102397577e-07, "loss": 1.1641, "step": 34578 }, { "epoch": 0.94, "learning_rate": 1.6203348248413408e-07, "loss": 1.2893, "step": 34579 }, { "epoch": 0.94, "learning_rate": 1.6187493953831456e-07, "loss": 1.3354, "step": 34580 }, { "epoch": 0.94, "learning_rate": 1.6171647356136077e-07, "loss": 1.1787, "step": 34581 }, { "epoch": 0.94, "learning_rate": 1.615580845545095e-07, "loss": 1.3728, "step": 34582 }, { "epoch": 0.94, "learning_rate": 1.6139977251900308e-07, "loss": 1.3799, "step": 34583 }, { "epoch": 0.94, "learning_rate": 1.6124153745607607e-07, "loss": 1.3652, "step": 34584 }, { "epoch": 0.94, "learning_rate": 1.6108337936697082e-07, "loss": 1.3242, "step": 34585 }, { "epoch": 0.94, "learning_rate": 1.609252982529219e-07, "loss": 1.0093, "step": 34586 }, { "epoch": 0.94, "learning_rate": 1.6076729411516613e-07, "loss": 1.249, "step": 34587 }, { "epoch": 0.94, "learning_rate": 1.6060936695494133e-07, "loss": 1.1838, "step": 34588 }, { "epoch": 0.94, "learning_rate": 1.6045151677348103e-07, "loss": 1.1753, "step": 34589 }, { "epoch": 0.94, "learning_rate": 1.602937435720231e-07, "loss": 1.2485, "step": 34590 }, { "epoch": 0.94, "learning_rate": 1.6013604735179768e-07, "loss": 1.2498, "step": 34591 }, { "epoch": 0.94, "learning_rate": 1.5997842811404263e-07, "loss": 0.928, "step": 34592 }, { "epoch": 0.94, "learning_rate": 1.59820885859987e-07, "loss": 1.2571, "step": 34593 }, { "epoch": 0.94, "learning_rate": 1.596634205908687e-07, "loss": 1.3455, "step": 34594 }, { "epoch": 0.94, "learning_rate": 1.595060323079145e-07, "loss": 1.3027, "step": 34595 }, { "epoch": 0.94, "learning_rate": 1.5934872101235787e-07, "loss": 1.2959, "step": 34596 }, { "epoch": 0.94, "learning_rate": 1.5919148670542895e-07, "loss": 1.2822, "step": 34597 }, { "epoch": 0.94, "learning_rate": 1.5903432938836005e-07, "loss": 1.3499, "step": 34598 }, { "epoch": 0.94, "learning_rate": 1.58877249062378e-07, "loss": 1.2639, "step": 34599 }, { "epoch": 0.94, "learning_rate": 1.5872024572871292e-07, "loss": 1.1941, "step": 34600 }, { "epoch": 0.94, "learning_rate": 1.585633193885927e-07, "loss": 1.3003, "step": 34601 }, { "epoch": 0.94, "learning_rate": 1.5840647004324527e-07, "loss": 1.3525, "step": 34602 }, { "epoch": 0.94, "learning_rate": 1.5824969769389854e-07, "loss": 1.1812, "step": 34603 }, { "epoch": 0.95, "learning_rate": 1.5809300234177705e-07, "loss": 1.344, "step": 34604 }, { "epoch": 0.95, "learning_rate": 1.5793638398810873e-07, "loss": 1.2318, "step": 34605 }, { "epoch": 0.95, "learning_rate": 1.5777984263411818e-07, "loss": 1.1882, "step": 34606 }, { "epoch": 0.95, "learning_rate": 1.5762337828102992e-07, "loss": 1.2717, "step": 34607 }, { "epoch": 0.95, "learning_rate": 1.5746699093006746e-07, "loss": 1.1501, "step": 34608 }, { "epoch": 0.95, "learning_rate": 1.5731068058245535e-07, "loss": 1.3105, "step": 34609 }, { "epoch": 0.95, "learning_rate": 1.5715444723941597e-07, "loss": 1.3032, "step": 34610 }, { "epoch": 0.95, "learning_rate": 1.569982909021728e-07, "loss": 1.188, "step": 34611 }, { "epoch": 0.95, "learning_rate": 1.568422115719448e-07, "loss": 1.1223, "step": 34612 }, { "epoch": 0.95, "learning_rate": 1.5668620924995547e-07, "loss": 1.1848, "step": 34613 }, { "epoch": 0.95, "learning_rate": 1.5653028393742498e-07, "loss": 1.2585, "step": 34614 }, { "epoch": 0.95, "learning_rate": 1.563744356355734e-07, "loss": 1.1617, "step": 34615 }, { "epoch": 0.95, "learning_rate": 1.562186643456176e-07, "loss": 1.2307, "step": 34616 }, { "epoch": 0.95, "learning_rate": 1.560629700687799e-07, "loss": 1.2322, "step": 34617 }, { "epoch": 0.95, "learning_rate": 1.55907352806276e-07, "loss": 1.2378, "step": 34618 }, { "epoch": 0.95, "learning_rate": 1.557518125593227e-07, "loss": 1.2385, "step": 34619 }, { "epoch": 0.95, "learning_rate": 1.5559634932914015e-07, "loss": 1.1316, "step": 34620 }, { "epoch": 0.95, "learning_rate": 1.5544096311694179e-07, "loss": 1.1948, "step": 34621 }, { "epoch": 0.95, "learning_rate": 1.5528565392394446e-07, "loss": 1.3594, "step": 34622 }, { "epoch": 0.95, "learning_rate": 1.5513042175136161e-07, "loss": 1.3064, "step": 34623 }, { "epoch": 0.95, "learning_rate": 1.5497526660041008e-07, "loss": 1.2263, "step": 34624 }, { "epoch": 0.95, "learning_rate": 1.5482018847230218e-07, "loss": 1.312, "step": 34625 }, { "epoch": 0.95, "learning_rate": 1.5466518736825142e-07, "loss": 1.1663, "step": 34626 }, { "epoch": 0.95, "learning_rate": 1.5451026328947017e-07, "loss": 1.0796, "step": 34627 }, { "epoch": 0.95, "learning_rate": 1.5435541623717188e-07, "loss": 1.2397, "step": 34628 }, { "epoch": 0.95, "learning_rate": 1.542006462125678e-07, "loss": 1.0688, "step": 34629 }, { "epoch": 0.95, "learning_rate": 1.54045953216867e-07, "loss": 1.3174, "step": 34630 }, { "epoch": 0.95, "learning_rate": 1.538913372512807e-07, "loss": 1.21, "step": 34631 }, { "epoch": 0.95, "learning_rate": 1.5373679831701794e-07, "loss": 1.2056, "step": 34632 }, { "epoch": 0.95, "learning_rate": 1.5358233641528996e-07, "loss": 1.7148, "step": 34633 }, { "epoch": 0.95, "learning_rate": 1.534279515473025e-07, "loss": 1.4702, "step": 34634 }, { "epoch": 0.95, "learning_rate": 1.5327364371426567e-07, "loss": 1.1487, "step": 34635 }, { "epoch": 0.95, "learning_rate": 1.5311941291738408e-07, "loss": 1.0874, "step": 34636 }, { "epoch": 0.95, "learning_rate": 1.5296525915786786e-07, "loss": 1.1902, "step": 34637 }, { "epoch": 0.95, "learning_rate": 1.528111824369194e-07, "loss": 1.1956, "step": 34638 }, { "epoch": 0.95, "learning_rate": 1.5265718275574658e-07, "loss": 1.261, "step": 34639 }, { "epoch": 0.95, "learning_rate": 1.5250326011555183e-07, "loss": 1.2668, "step": 34640 }, { "epoch": 0.95, "learning_rate": 1.5234941451754415e-07, "loss": 1.3345, "step": 34641 }, { "epoch": 0.95, "learning_rate": 1.5219564596292146e-07, "loss": 1.1025, "step": 34642 }, { "epoch": 0.95, "learning_rate": 1.5204195445288948e-07, "loss": 1.3364, "step": 34643 }, { "epoch": 0.95, "learning_rate": 1.518883399886506e-07, "loss": 1.2178, "step": 34644 }, { "epoch": 0.95, "learning_rate": 1.5173480257140715e-07, "loss": 1.3677, "step": 34645 }, { "epoch": 0.95, "learning_rate": 1.515813422023593e-07, "loss": 1.334, "step": 34646 }, { "epoch": 0.95, "learning_rate": 1.5142795888270834e-07, "loss": 1.1768, "step": 34647 }, { "epoch": 0.95, "learning_rate": 1.5127465261365215e-07, "loss": 1.2788, "step": 34648 }, { "epoch": 0.95, "learning_rate": 1.5112142339639312e-07, "loss": 1.1987, "step": 34649 }, { "epoch": 0.95, "learning_rate": 1.509682712321292e-07, "loss": 1.1738, "step": 34650 }, { "epoch": 0.95, "learning_rate": 1.508151961220572e-07, "loss": 1.2175, "step": 34651 }, { "epoch": 0.95, "learning_rate": 1.5066219806737724e-07, "loss": 1.2385, "step": 34652 }, { "epoch": 0.95, "learning_rate": 1.5050927706928397e-07, "loss": 1.0442, "step": 34653 }, { "epoch": 0.95, "learning_rate": 1.503564331289742e-07, "loss": 1.0659, "step": 34654 }, { "epoch": 0.95, "learning_rate": 1.502036662476436e-07, "loss": 1.0674, "step": 34655 }, { "epoch": 0.95, "learning_rate": 1.5005097642648902e-07, "loss": 1.2141, "step": 34656 }, { "epoch": 0.95, "learning_rate": 1.4989836366670284e-07, "loss": 1.324, "step": 34657 }, { "epoch": 0.95, "learning_rate": 1.4974582796948078e-07, "loss": 1.271, "step": 34658 }, { "epoch": 0.95, "learning_rate": 1.4959336933601521e-07, "loss": 1.1436, "step": 34659 }, { "epoch": 0.95, "learning_rate": 1.4944098776749849e-07, "loss": 1.269, "step": 34660 }, { "epoch": 0.95, "learning_rate": 1.4928868326512414e-07, "loss": 1.3306, "step": 34661 }, { "epoch": 0.95, "learning_rate": 1.491364558300834e-07, "loss": 1.3147, "step": 34662 }, { "epoch": 0.95, "learning_rate": 1.4898430546356536e-07, "loss": 1.2512, "step": 34663 }, { "epoch": 0.95, "learning_rate": 1.4883223216676346e-07, "loss": 1.4224, "step": 34664 }, { "epoch": 0.95, "learning_rate": 1.4868023594086568e-07, "loss": 1.27, "step": 34665 }, { "epoch": 0.95, "learning_rate": 1.4852831678705992e-07, "loss": 1.1062, "step": 34666 }, { "epoch": 0.95, "learning_rate": 1.4837647470653748e-07, "loss": 1.6499, "step": 34667 }, { "epoch": 0.95, "learning_rate": 1.482247097004841e-07, "loss": 1.1455, "step": 34668 }, { "epoch": 0.95, "learning_rate": 1.4807302177008874e-07, "loss": 1.1914, "step": 34669 }, { "epoch": 0.95, "learning_rate": 1.479214109165361e-07, "loss": 1.1028, "step": 34670 }, { "epoch": 0.95, "learning_rate": 1.477698771410152e-07, "loss": 1.2771, "step": 34671 }, { "epoch": 0.95, "learning_rate": 1.4761842044470842e-07, "loss": 1.385, "step": 34672 }, { "epoch": 0.95, "learning_rate": 1.474670408288037e-07, "loss": 1.0602, "step": 34673 }, { "epoch": 0.95, "learning_rate": 1.473157382944823e-07, "loss": 1.3406, "step": 34674 }, { "epoch": 0.95, "learning_rate": 1.471645128429311e-07, "loss": 1.303, "step": 34675 }, { "epoch": 0.95, "learning_rate": 1.470133644753302e-07, "loss": 1.0935, "step": 34676 }, { "epoch": 0.95, "learning_rate": 1.4686229319286428e-07, "loss": 1.2639, "step": 34677 }, { "epoch": 0.95, "learning_rate": 1.4671129899671454e-07, "loss": 1.1726, "step": 34678 }, { "epoch": 0.95, "learning_rate": 1.465603818880612e-07, "loss": 1.3884, "step": 34679 }, { "epoch": 0.95, "learning_rate": 1.4640954186808775e-07, "loss": 1.7104, "step": 34680 }, { "epoch": 0.95, "learning_rate": 1.4625877893797101e-07, "loss": 1.1372, "step": 34681 }, { "epoch": 0.95, "learning_rate": 1.461080930988934e-07, "loss": 1.2385, "step": 34682 }, { "epoch": 0.95, "learning_rate": 1.4595748435203062e-07, "loss": 1.2285, "step": 34683 }, { "epoch": 0.95, "learning_rate": 1.4580695269856505e-07, "loss": 1.2515, "step": 34684 }, { "epoch": 0.95, "learning_rate": 1.456564981396702e-07, "loss": 1.2188, "step": 34685 }, { "epoch": 0.95, "learning_rate": 1.4550612067652627e-07, "loss": 1.3518, "step": 34686 }, { "epoch": 0.95, "learning_rate": 1.4535582031030782e-07, "loss": 1.1729, "step": 34687 }, { "epoch": 0.95, "learning_rate": 1.4520559704219283e-07, "loss": 1.1943, "step": 34688 }, { "epoch": 0.95, "learning_rate": 1.4505545087335372e-07, "loss": 1.199, "step": 34689 }, { "epoch": 0.95, "learning_rate": 1.4490538180496727e-07, "loss": 1.3135, "step": 34690 }, { "epoch": 0.95, "learning_rate": 1.4475538983820592e-07, "loss": 1.1659, "step": 34691 }, { "epoch": 0.95, "learning_rate": 1.4460547497424537e-07, "loss": 1.2654, "step": 34692 }, { "epoch": 0.95, "learning_rate": 1.4445563721425692e-07, "loss": 1.2458, "step": 34693 }, { "epoch": 0.95, "learning_rate": 1.4430587655941187e-07, "loss": 1.2766, "step": 34694 }, { "epoch": 0.95, "learning_rate": 1.441561930108848e-07, "loss": 1.3323, "step": 34695 }, { "epoch": 0.95, "learning_rate": 1.4400658656984478e-07, "loss": 1.3296, "step": 34696 }, { "epoch": 0.95, "learning_rate": 1.4385705723746313e-07, "loss": 1.1619, "step": 34697 }, { "epoch": 0.95, "learning_rate": 1.4370760501490778e-07, "loss": 1.1582, "step": 34698 }, { "epoch": 0.95, "learning_rate": 1.4355822990335e-07, "loss": 1.1405, "step": 34699 }, { "epoch": 0.95, "learning_rate": 1.4340893190395888e-07, "loss": 1.176, "step": 34700 }, { "epoch": 0.95, "learning_rate": 1.4325971101790015e-07, "loss": 1.3035, "step": 34701 }, { "epoch": 0.95, "learning_rate": 1.4311056724634286e-07, "loss": 1.2253, "step": 34702 }, { "epoch": 0.95, "learning_rate": 1.4296150059045276e-07, "loss": 1.3184, "step": 34703 }, { "epoch": 0.95, "learning_rate": 1.4281251105139782e-07, "loss": 1.3438, "step": 34704 }, { "epoch": 0.95, "learning_rate": 1.4266359863034263e-07, "loss": 1.2837, "step": 34705 }, { "epoch": 0.95, "learning_rate": 1.425147633284518e-07, "loss": 1.3123, "step": 34706 }, { "epoch": 0.95, "learning_rate": 1.4236600514689003e-07, "loss": 1.6211, "step": 34707 }, { "epoch": 0.95, "learning_rate": 1.4221732408682188e-07, "loss": 1.2036, "step": 34708 }, { "epoch": 0.95, "learning_rate": 1.4206872014940863e-07, "loss": 1.3105, "step": 34709 }, { "epoch": 0.95, "learning_rate": 1.4192019333581498e-07, "loss": 1.2668, "step": 34710 }, { "epoch": 0.95, "learning_rate": 1.4177174364720215e-07, "loss": 1.2081, "step": 34711 }, { "epoch": 0.95, "learning_rate": 1.4162337108473145e-07, "loss": 1.2461, "step": 34712 }, { "epoch": 0.95, "learning_rate": 1.414750756495631e-07, "loss": 1.2686, "step": 34713 }, { "epoch": 0.95, "learning_rate": 1.4132685734285944e-07, "loss": 1.2339, "step": 34714 }, { "epoch": 0.95, "learning_rate": 1.411787161657774e-07, "loss": 1.146, "step": 34715 }, { "epoch": 0.95, "learning_rate": 1.410306521194782e-07, "loss": 1.2166, "step": 34716 }, { "epoch": 0.95, "learning_rate": 1.408826652051176e-07, "loss": 1.301, "step": 34717 }, { "epoch": 0.95, "learning_rate": 1.4073475542385585e-07, "loss": 1.2131, "step": 34718 }, { "epoch": 0.95, "learning_rate": 1.405869227768497e-07, "loss": 1.1812, "step": 34719 }, { "epoch": 0.95, "learning_rate": 1.4043916726525496e-07, "loss": 1.3486, "step": 34720 }, { "epoch": 0.95, "learning_rate": 1.4029148889022736e-07, "loss": 1.2939, "step": 34721 }, { "epoch": 0.95, "learning_rate": 1.4014388765292375e-07, "loss": 1.2747, "step": 34722 }, { "epoch": 0.95, "learning_rate": 1.3999636355449654e-07, "loss": 1.2131, "step": 34723 }, { "epoch": 0.95, "learning_rate": 1.3984891659610257e-07, "loss": 1.2467, "step": 34724 }, { "epoch": 0.95, "learning_rate": 1.3970154677889313e-07, "loss": 1.3472, "step": 34725 }, { "epoch": 0.95, "learning_rate": 1.395542541040218e-07, "loss": 1.1301, "step": 34726 }, { "epoch": 0.95, "learning_rate": 1.3940703857264314e-07, "loss": 1.3542, "step": 34727 }, { "epoch": 0.95, "learning_rate": 1.3925990018590518e-07, "loss": 1.3777, "step": 34728 }, { "epoch": 0.95, "learning_rate": 1.3911283894496253e-07, "loss": 1.2617, "step": 34729 }, { "epoch": 0.95, "learning_rate": 1.3896585485096204e-07, "loss": 1.2817, "step": 34730 }, { "epoch": 0.95, "learning_rate": 1.3881894790505834e-07, "loss": 1.2856, "step": 34731 }, { "epoch": 0.95, "learning_rate": 1.386721181083961e-07, "loss": 1.3154, "step": 34732 }, { "epoch": 0.95, "learning_rate": 1.3852536546212657e-07, "loss": 1.231, "step": 34733 }, { "epoch": 0.95, "learning_rate": 1.383786899673978e-07, "loss": 1.1365, "step": 34734 }, { "epoch": 0.95, "learning_rate": 1.3823209162535768e-07, "loss": 1.2371, "step": 34735 }, { "epoch": 0.95, "learning_rate": 1.3808557043715088e-07, "loss": 1.314, "step": 34736 }, { "epoch": 0.95, "learning_rate": 1.3793912640392538e-07, "loss": 1.1971, "step": 34737 }, { "epoch": 0.95, "learning_rate": 1.377927595268269e-07, "loss": 1.3948, "step": 34738 }, { "epoch": 0.95, "learning_rate": 1.3764646980700013e-07, "loss": 1.0872, "step": 34739 }, { "epoch": 0.95, "learning_rate": 1.375002572455897e-07, "loss": 1.1736, "step": 34740 }, { "epoch": 0.95, "learning_rate": 1.373541218437402e-07, "loss": 1.3083, "step": 34741 }, { "epoch": 0.95, "learning_rate": 1.372080636025941e-07, "loss": 1.1133, "step": 34742 }, { "epoch": 0.95, "learning_rate": 1.3706208252329377e-07, "loss": 1.3452, "step": 34743 }, { "epoch": 0.95, "learning_rate": 1.3691617860698282e-07, "loss": 1.4546, "step": 34744 }, { "epoch": 0.95, "learning_rate": 1.3677035185480024e-07, "loss": 1.2781, "step": 34745 }, { "epoch": 0.95, "learning_rate": 1.3662460226788966e-07, "loss": 1.3447, "step": 34746 }, { "epoch": 0.95, "learning_rate": 1.3647892984739007e-07, "loss": 1.3772, "step": 34747 }, { "epoch": 0.95, "learning_rate": 1.3633333459444177e-07, "loss": 1.1294, "step": 34748 }, { "epoch": 0.95, "learning_rate": 1.3618781651018155e-07, "loss": 1.197, "step": 34749 }, { "epoch": 0.95, "learning_rate": 1.3604237559575073e-07, "loss": 1.3738, "step": 34750 }, { "epoch": 0.95, "learning_rate": 1.358970118522851e-07, "loss": 1.2322, "step": 34751 }, { "epoch": 0.95, "learning_rate": 1.3575172528092374e-07, "loss": 1.2256, "step": 34752 }, { "epoch": 0.95, "learning_rate": 1.3560651588280126e-07, "loss": 1.1658, "step": 34753 }, { "epoch": 0.95, "learning_rate": 1.354613836590568e-07, "loss": 1.0757, "step": 34754 }, { "epoch": 0.95, "learning_rate": 1.3531632861082277e-07, "loss": 1.231, "step": 34755 }, { "epoch": 0.95, "learning_rate": 1.3517135073923383e-07, "loss": 1.2229, "step": 34756 }, { "epoch": 0.95, "learning_rate": 1.350264500454268e-07, "loss": 1.7837, "step": 34757 }, { "epoch": 0.95, "learning_rate": 1.3488162653053416e-07, "loss": 1.2441, "step": 34758 }, { "epoch": 0.95, "learning_rate": 1.3473688019568831e-07, "loss": 1.1331, "step": 34759 }, { "epoch": 0.95, "learning_rate": 1.345922110420217e-07, "loss": 1.3264, "step": 34760 }, { "epoch": 0.95, "learning_rate": 1.3444761907066783e-07, "loss": 1.437, "step": 34761 }, { "epoch": 0.95, "learning_rate": 1.3430310428275584e-07, "loss": 1.3577, "step": 34762 }, { "epoch": 0.95, "learning_rate": 1.3415866667941813e-07, "loss": 1.3481, "step": 34763 }, { "epoch": 0.95, "learning_rate": 1.340143062617816e-07, "loss": 1.2996, "step": 34764 }, { "epoch": 0.95, "learning_rate": 1.3387002303097972e-07, "loss": 1.1667, "step": 34765 }, { "epoch": 0.95, "learning_rate": 1.3372581698813946e-07, "loss": 1.1951, "step": 34766 }, { "epoch": 0.95, "learning_rate": 1.3358168813438764e-07, "loss": 1.3066, "step": 34767 }, { "epoch": 0.95, "learning_rate": 1.334376364708534e-07, "loss": 1.2126, "step": 34768 }, { "epoch": 0.95, "learning_rate": 1.3329366199866467e-07, "loss": 1.3062, "step": 34769 }, { "epoch": 0.95, "learning_rate": 1.3314976471894504e-07, "loss": 1.3262, "step": 34770 }, { "epoch": 0.95, "learning_rate": 1.3300594463282467e-07, "loss": 1.3428, "step": 34771 }, { "epoch": 0.95, "learning_rate": 1.3286220174142382e-07, "loss": 1.1614, "step": 34772 }, { "epoch": 0.95, "learning_rate": 1.3271853604586826e-07, "loss": 1.3423, "step": 34773 }, { "epoch": 0.95, "learning_rate": 1.3257494754728485e-07, "loss": 1.2227, "step": 34774 }, { "epoch": 0.95, "learning_rate": 1.3243143624679488e-07, "loss": 1.2888, "step": 34775 }, { "epoch": 0.95, "learning_rate": 1.3228800214552085e-07, "loss": 1.2275, "step": 34776 }, { "epoch": 0.95, "learning_rate": 1.3214464524458514e-07, "loss": 1.2244, "step": 34777 }, { "epoch": 0.95, "learning_rate": 1.3200136554511022e-07, "loss": 1.3174, "step": 34778 }, { "epoch": 0.95, "learning_rate": 1.3185816304821632e-07, "loss": 1.2737, "step": 34779 }, { "epoch": 0.95, "learning_rate": 1.3171503775502358e-07, "loss": 1.1611, "step": 34780 }, { "epoch": 0.95, "learning_rate": 1.315719896666512e-07, "loss": 1.2549, "step": 34781 }, { "epoch": 0.95, "learning_rate": 1.3142901878422044e-07, "loss": 1.3347, "step": 34782 }, { "epoch": 0.95, "learning_rate": 1.3128612510884819e-07, "loss": 1.3005, "step": 34783 }, { "epoch": 0.95, "learning_rate": 1.3114330864165248e-07, "loss": 1.2957, "step": 34784 }, { "epoch": 0.95, "learning_rate": 1.3100056938375018e-07, "loss": 1.2083, "step": 34785 }, { "epoch": 0.95, "learning_rate": 1.3085790733625924e-07, "loss": 1.7256, "step": 34786 }, { "epoch": 0.95, "learning_rate": 1.307153225002955e-07, "loss": 1.2852, "step": 34787 }, { "epoch": 0.95, "learning_rate": 1.305728148769736e-07, "loss": 1.1714, "step": 34788 }, { "epoch": 0.95, "learning_rate": 1.304303844674104e-07, "loss": 1.2458, "step": 34789 }, { "epoch": 0.95, "learning_rate": 1.3028803127271728e-07, "loss": 1.3352, "step": 34790 }, { "epoch": 0.95, "learning_rate": 1.3014575529401108e-07, "loss": 1.3657, "step": 34791 }, { "epoch": 0.95, "learning_rate": 1.3000355653240204e-07, "loss": 1.2805, "step": 34792 }, { "epoch": 0.95, "learning_rate": 1.2986143498900484e-07, "loss": 1.238, "step": 34793 }, { "epoch": 0.95, "learning_rate": 1.2971939066492966e-07, "loss": 0.9653, "step": 34794 }, { "epoch": 0.95, "learning_rate": 1.29577423561289e-07, "loss": 1.3289, "step": 34795 }, { "epoch": 0.95, "learning_rate": 1.2943553367919305e-07, "loss": 1.2092, "step": 34796 }, { "epoch": 0.95, "learning_rate": 1.2929372101975314e-07, "loss": 1.0571, "step": 34797 }, { "epoch": 0.95, "learning_rate": 1.2915198558407616e-07, "loss": 1.3347, "step": 34798 }, { "epoch": 0.95, "learning_rate": 1.2901032737327345e-07, "loss": 1.3586, "step": 34799 }, { "epoch": 0.95, "learning_rate": 1.288687463884508e-07, "loss": 1.3657, "step": 34800 }, { "epoch": 0.95, "learning_rate": 1.2872724263071957e-07, "loss": 1.2368, "step": 34801 }, { "epoch": 0.95, "learning_rate": 1.2858581610118325e-07, "loss": 1.3435, "step": 34802 }, { "epoch": 0.95, "learning_rate": 1.284444668009488e-07, "loss": 1.3506, "step": 34803 }, { "epoch": 0.95, "learning_rate": 1.283031947311242e-07, "loss": 1.1899, "step": 34804 }, { "epoch": 0.95, "learning_rate": 1.2816199989281296e-07, "loss": 1.2, "step": 34805 }, { "epoch": 0.95, "learning_rate": 1.2802088228712096e-07, "loss": 1.2932, "step": 34806 }, { "epoch": 0.95, "learning_rate": 1.2787984191515058e-07, "loss": 1.2148, "step": 34807 }, { "epoch": 0.95, "learning_rate": 1.277388787780065e-07, "loss": 1.2512, "step": 34808 }, { "epoch": 0.95, "learning_rate": 1.275979928767901e-07, "loss": 1.1953, "step": 34809 }, { "epoch": 0.95, "learning_rate": 1.274571842126071e-07, "loss": 1.304, "step": 34810 }, { "epoch": 0.95, "learning_rate": 1.2731645278655448e-07, "loss": 1.1426, "step": 34811 }, { "epoch": 0.95, "learning_rate": 1.2717579859973573e-07, "loss": 1.1802, "step": 34812 }, { "epoch": 0.95, "learning_rate": 1.270352216532511e-07, "loss": 1.2122, "step": 34813 }, { "epoch": 0.95, "learning_rate": 1.2689472194820197e-07, "loss": 1.1836, "step": 34814 }, { "epoch": 0.95, "learning_rate": 1.2675429948568408e-07, "loss": 1.1389, "step": 34815 }, { "epoch": 0.95, "learning_rate": 1.266139542667988e-07, "loss": 1.2002, "step": 34816 }, { "epoch": 0.95, "learning_rate": 1.2647368629264189e-07, "loss": 1.4434, "step": 34817 }, { "epoch": 0.95, "learning_rate": 1.263334955643125e-07, "loss": 1.1545, "step": 34818 }, { "epoch": 0.95, "learning_rate": 1.2619338208290754e-07, "loss": 1.4106, "step": 34819 }, { "epoch": 0.95, "learning_rate": 1.2605334584952167e-07, "loss": 1.1775, "step": 34820 }, { "epoch": 0.95, "learning_rate": 1.2591338686525177e-07, "loss": 1.3484, "step": 34821 }, { "epoch": 0.95, "learning_rate": 1.2577350513119368e-07, "loss": 1.2209, "step": 34822 }, { "epoch": 0.95, "learning_rate": 1.256337006484387e-07, "loss": 1.2673, "step": 34823 }, { "epoch": 0.95, "learning_rate": 1.2549397341808266e-07, "loss": 1.0679, "step": 34824 }, { "epoch": 0.95, "learning_rate": 1.2535432344121912e-07, "loss": 1.304, "step": 34825 }, { "epoch": 0.95, "learning_rate": 1.2521475071894052e-07, "loss": 1.3992, "step": 34826 }, { "epoch": 0.95, "learning_rate": 1.250752552523371e-07, "loss": 1.123, "step": 34827 }, { "epoch": 0.95, "learning_rate": 1.2493583704250135e-07, "loss": 1.1655, "step": 34828 }, { "epoch": 0.95, "learning_rate": 1.2479649609052458e-07, "loss": 1.2063, "step": 34829 }, { "epoch": 0.95, "learning_rate": 1.2465723239749594e-07, "loss": 1.2439, "step": 34830 }, { "epoch": 0.95, "learning_rate": 1.2451804596450568e-07, "loss": 1.3081, "step": 34831 }, { "epoch": 0.95, "learning_rate": 1.243789367926418e-07, "loss": 1.3335, "step": 34832 }, { "epoch": 0.95, "learning_rate": 1.2423990488299453e-07, "loss": 1.2607, "step": 34833 }, { "epoch": 0.95, "learning_rate": 1.241009502366497e-07, "loss": 1.2351, "step": 34834 }, { "epoch": 0.95, "learning_rate": 1.239620728546953e-07, "loss": 1.3157, "step": 34835 }, { "epoch": 0.95, "learning_rate": 1.2382327273821716e-07, "loss": 1.3708, "step": 34836 }, { "epoch": 0.95, "learning_rate": 1.2368454988830213e-07, "loss": 1.2917, "step": 34837 }, { "epoch": 0.95, "learning_rate": 1.2354590430603497e-07, "loss": 1.2178, "step": 34838 }, { "epoch": 0.95, "learning_rate": 1.2340733599249922e-07, "loss": 1.2529, "step": 34839 }, { "epoch": 0.95, "learning_rate": 1.2326884494878178e-07, "loss": 1.2766, "step": 34840 }, { "epoch": 0.95, "learning_rate": 1.2313043117596402e-07, "loss": 1.2961, "step": 34841 }, { "epoch": 0.95, "learning_rate": 1.229920946751295e-07, "loss": 1.2957, "step": 34842 }, { "epoch": 0.95, "learning_rate": 1.2285383544735853e-07, "loss": 1.0928, "step": 34843 }, { "epoch": 0.95, "learning_rate": 1.227156534937368e-07, "loss": 1.1892, "step": 34844 }, { "epoch": 0.95, "learning_rate": 1.2257754881534246e-07, "loss": 1.022, "step": 34845 }, { "epoch": 0.95, "learning_rate": 1.2243952141325677e-07, "loss": 1.2651, "step": 34846 }, { "epoch": 0.95, "learning_rate": 1.223015712885589e-07, "loss": 1.125, "step": 34847 }, { "epoch": 0.95, "learning_rate": 1.2216369844232913e-07, "loss": 1.1873, "step": 34848 }, { "epoch": 0.95, "learning_rate": 1.2202590287564654e-07, "loss": 1.2429, "step": 34849 }, { "epoch": 0.95, "learning_rate": 1.2188818458958696e-07, "loss": 1.313, "step": 34850 }, { "epoch": 0.95, "learning_rate": 1.2175054358522954e-07, "loss": 1.3491, "step": 34851 }, { "epoch": 0.95, "learning_rate": 1.2161297986365117e-07, "loss": 1.282, "step": 34852 }, { "epoch": 0.95, "learning_rate": 1.2147549342592878e-07, "loss": 1.1443, "step": 34853 }, { "epoch": 0.95, "learning_rate": 1.2133808427313486e-07, "loss": 1.248, "step": 34854 }, { "epoch": 0.95, "learning_rate": 1.2120075240634743e-07, "loss": 1.3101, "step": 34855 }, { "epoch": 0.95, "learning_rate": 1.2106349782664005e-07, "loss": 1.3323, "step": 34856 }, { "epoch": 0.95, "learning_rate": 1.2092632053508636e-07, "loss": 1.2781, "step": 34857 }, { "epoch": 0.95, "learning_rate": 1.207892205327599e-07, "loss": 1.3296, "step": 34858 }, { "epoch": 0.95, "learning_rate": 1.2065219782073312e-07, "loss": 1.3633, "step": 34859 }, { "epoch": 0.95, "learning_rate": 1.2051525240007632e-07, "loss": 1.7021, "step": 34860 }, { "epoch": 0.95, "learning_rate": 1.2037838427186532e-07, "loss": 1.2502, "step": 34861 }, { "epoch": 0.95, "learning_rate": 1.202415934371659e-07, "loss": 1.2578, "step": 34862 }, { "epoch": 0.95, "learning_rate": 1.2010487989705166e-07, "loss": 1.1638, "step": 34863 }, { "epoch": 0.95, "learning_rate": 1.1996824365258953e-07, "loss": 1.3152, "step": 34864 }, { "epoch": 0.95, "learning_rate": 1.1983168470485085e-07, "loss": 1.2915, "step": 34865 }, { "epoch": 0.95, "learning_rate": 1.1969520305490368e-07, "loss": 1.3506, "step": 34866 }, { "epoch": 0.95, "learning_rate": 1.195587987038138e-07, "loss": 1.386, "step": 34867 }, { "epoch": 0.95, "learning_rate": 1.1942247165265152e-07, "loss": 1.3242, "step": 34868 }, { "epoch": 0.95, "learning_rate": 1.192862219024804e-07, "loss": 1.092, "step": 34869 }, { "epoch": 0.95, "learning_rate": 1.1915004945436848e-07, "loss": 1.3091, "step": 34870 }, { "epoch": 0.95, "learning_rate": 1.1901395430937934e-07, "loss": 1.4211, "step": 34871 }, { "epoch": 0.95, "learning_rate": 1.1887793646857993e-07, "loss": 1.271, "step": 34872 }, { "epoch": 0.95, "learning_rate": 1.187419959330316e-07, "loss": 1.2847, "step": 34873 }, { "epoch": 0.95, "learning_rate": 1.1860613270380016e-07, "loss": 1.1355, "step": 34874 }, { "epoch": 0.95, "learning_rate": 1.1847034678194813e-07, "loss": 1.3911, "step": 34875 }, { "epoch": 0.95, "learning_rate": 1.1833463816853685e-07, "loss": 1.3513, "step": 34876 }, { "epoch": 0.95, "learning_rate": 1.1819900686462882e-07, "loss": 1.2678, "step": 34877 }, { "epoch": 0.95, "learning_rate": 1.180634528712854e-07, "loss": 1.2339, "step": 34878 }, { "epoch": 0.95, "learning_rate": 1.1792797618956575e-07, "loss": 1.2751, "step": 34879 }, { "epoch": 0.95, "learning_rate": 1.1779257682053236e-07, "loss": 1.3025, "step": 34880 }, { "epoch": 0.95, "learning_rate": 1.1765725476524215e-07, "loss": 1.416, "step": 34881 }, { "epoch": 0.95, "learning_rate": 1.1752201002475317e-07, "loss": 1.1057, "step": 34882 }, { "epoch": 0.95, "learning_rate": 1.1738684260012679e-07, "loss": 1.0806, "step": 34883 }, { "epoch": 0.95, "learning_rate": 1.1725175249241772e-07, "loss": 1.1777, "step": 34884 }, { "epoch": 0.95, "learning_rate": 1.17116739702684e-07, "loss": 1.3071, "step": 34885 }, { "epoch": 0.95, "learning_rate": 1.1698180423198146e-07, "loss": 1.3853, "step": 34886 }, { "epoch": 0.95, "learning_rate": 1.1684694608136594e-07, "loss": 1.2917, "step": 34887 }, { "epoch": 0.95, "learning_rate": 1.1671216525189322e-07, "loss": 1.2727, "step": 34888 }, { "epoch": 0.95, "learning_rate": 1.1657746174461693e-07, "loss": 1.3696, "step": 34889 }, { "epoch": 0.95, "learning_rate": 1.1644283556059067e-07, "loss": 1.4236, "step": 34890 }, { "epoch": 0.95, "learning_rate": 1.1630828670086802e-07, "loss": 1.3076, "step": 34891 }, { "epoch": 0.95, "learning_rate": 1.161738151665015e-07, "loss": 0.9452, "step": 34892 }, { "epoch": 0.95, "learning_rate": 1.160394209585447e-07, "loss": 1.1572, "step": 34893 }, { "epoch": 0.95, "learning_rate": 1.1590510407804567e-07, "loss": 1.198, "step": 34894 }, { "epoch": 0.95, "learning_rate": 1.1577086452605801e-07, "loss": 1.2109, "step": 34895 }, { "epoch": 0.95, "learning_rate": 1.1563670230363199e-07, "loss": 1.4121, "step": 34896 }, { "epoch": 0.95, "learning_rate": 1.1550261741181568e-07, "loss": 1.0342, "step": 34897 }, { "epoch": 0.95, "learning_rate": 1.1536860985165933e-07, "loss": 1.259, "step": 34898 }, { "epoch": 0.95, "learning_rate": 1.1523467962420987e-07, "loss": 1.1079, "step": 34899 }, { "epoch": 0.95, "learning_rate": 1.1510082673051759e-07, "loss": 1.3523, "step": 34900 }, { "epoch": 0.95, "learning_rate": 1.149670511716272e-07, "loss": 1.3582, "step": 34901 }, { "epoch": 0.95, "learning_rate": 1.1483335294858677e-07, "loss": 1.2971, "step": 34902 }, { "epoch": 0.95, "learning_rate": 1.1469973206244211e-07, "loss": 1.1716, "step": 34903 }, { "epoch": 0.95, "learning_rate": 1.1456618851423906e-07, "loss": 1.2893, "step": 34904 }, { "epoch": 0.95, "learning_rate": 1.1443272230502011e-07, "loss": 1.2676, "step": 34905 }, { "epoch": 0.95, "learning_rate": 1.142993334358311e-07, "loss": 1.2805, "step": 34906 }, { "epoch": 0.95, "learning_rate": 1.1416602190771565e-07, "loss": 1.2883, "step": 34907 }, { "epoch": 0.95, "learning_rate": 1.1403278772171844e-07, "loss": 1.3145, "step": 34908 }, { "epoch": 0.95, "learning_rate": 1.1389963087887756e-07, "loss": 1.269, "step": 34909 }, { "epoch": 0.95, "learning_rate": 1.1376655138023885e-07, "loss": 1.3716, "step": 34910 }, { "epoch": 0.95, "learning_rate": 1.1363354922684034e-07, "loss": 1.209, "step": 34911 }, { "epoch": 0.95, "learning_rate": 1.1350062441972454e-07, "loss": 1.3831, "step": 34912 }, { "epoch": 0.95, "learning_rate": 1.1336777695993173e-07, "loss": 1.1775, "step": 34913 }, { "epoch": 0.95, "learning_rate": 1.1323500684849886e-07, "loss": 1.2654, "step": 34914 }, { "epoch": 0.95, "learning_rate": 1.1310231408646844e-07, "loss": 1.269, "step": 34915 }, { "epoch": 0.95, "learning_rate": 1.1296969867487517e-07, "loss": 1.2607, "step": 34916 }, { "epoch": 0.95, "learning_rate": 1.1283716061475714e-07, "loss": 1.1124, "step": 34917 }, { "epoch": 0.95, "learning_rate": 1.1270469990715238e-07, "loss": 1.2712, "step": 34918 }, { "epoch": 0.95, "learning_rate": 1.1257231655309674e-07, "loss": 1.3538, "step": 34919 }, { "epoch": 0.95, "learning_rate": 1.1244001055362608e-07, "loss": 1.3022, "step": 34920 }, { "epoch": 0.95, "learning_rate": 1.123077819097762e-07, "loss": 1.3418, "step": 34921 }, { "epoch": 0.95, "learning_rate": 1.1217563062257853e-07, "loss": 1.2903, "step": 34922 }, { "epoch": 0.95, "learning_rate": 1.120435566930711e-07, "loss": 1.1917, "step": 34923 }, { "epoch": 0.95, "learning_rate": 1.1191156012228421e-07, "loss": 1.2744, "step": 34924 }, { "epoch": 0.95, "learning_rate": 1.1177964091125259e-07, "loss": 1.1973, "step": 34925 }, { "epoch": 0.95, "learning_rate": 1.1164779906100542e-07, "loss": 1.3237, "step": 34926 }, { "epoch": 0.95, "learning_rate": 1.1151603457257742e-07, "loss": 1.6555, "step": 34927 }, { "epoch": 0.95, "learning_rate": 1.1138434744699889e-07, "loss": 1.2544, "step": 34928 }, { "epoch": 0.95, "learning_rate": 1.1125273768529677e-07, "loss": 1.3748, "step": 34929 }, { "epoch": 0.95, "learning_rate": 1.1112120528850578e-07, "loss": 1.1729, "step": 34930 }, { "epoch": 0.95, "learning_rate": 1.1098975025765069e-07, "loss": 1.3403, "step": 34931 }, { "epoch": 0.95, "learning_rate": 1.1085837259376287e-07, "loss": 1.3887, "step": 34932 }, { "epoch": 0.95, "learning_rate": 1.1072707229786817e-07, "loss": 1.1436, "step": 34933 }, { "epoch": 0.95, "learning_rate": 1.1059584937099466e-07, "loss": 1.2947, "step": 34934 }, { "epoch": 0.95, "learning_rate": 1.104647038141693e-07, "loss": 1.3843, "step": 34935 }, { "epoch": 0.95, "learning_rate": 1.1033363562841681e-07, "loss": 1.1787, "step": 34936 }, { "epoch": 0.95, "learning_rate": 1.1020264481476417e-07, "loss": 1.1736, "step": 34937 }, { "epoch": 0.95, "learning_rate": 1.10071731374235e-07, "loss": 1.3345, "step": 34938 }, { "epoch": 0.95, "learning_rate": 1.0994089530785513e-07, "loss": 1.0822, "step": 34939 }, { "epoch": 0.95, "learning_rate": 1.0981013661664707e-07, "loss": 1.2595, "step": 34940 }, { "epoch": 0.95, "learning_rate": 1.0967945530163227e-07, "loss": 1.4158, "step": 34941 }, { "epoch": 0.95, "learning_rate": 1.0954885136383542e-07, "loss": 1.3208, "step": 34942 }, { "epoch": 0.95, "learning_rate": 1.0941832480427794e-07, "loss": 1.2507, "step": 34943 }, { "epoch": 0.95, "learning_rate": 1.0928787562398014e-07, "loss": 1.125, "step": 34944 }, { "epoch": 0.95, "learning_rate": 1.091575038239634e-07, "loss": 1.2793, "step": 34945 }, { "epoch": 0.95, "learning_rate": 1.0902720940524692e-07, "loss": 1.2036, "step": 34946 }, { "epoch": 0.95, "learning_rate": 1.0889699236885099e-07, "loss": 1.2991, "step": 34947 }, { "epoch": 0.95, "learning_rate": 1.0876685271579368e-07, "loss": 1.1301, "step": 34948 }, { "epoch": 0.95, "learning_rate": 1.0863679044709308e-07, "loss": 1.2815, "step": 34949 }, { "epoch": 0.95, "learning_rate": 1.0850680556376725e-07, "loss": 1.2751, "step": 34950 }, { "epoch": 0.95, "learning_rate": 1.0837689806683315e-07, "loss": 1.2839, "step": 34951 }, { "epoch": 0.95, "learning_rate": 1.0824706795730555e-07, "loss": 1.2527, "step": 34952 }, { "epoch": 0.95, "learning_rate": 1.0811731523620361e-07, "loss": 1.2651, "step": 34953 }, { "epoch": 0.95, "learning_rate": 1.0798763990453764e-07, "loss": 1.1792, "step": 34954 }, { "epoch": 0.95, "learning_rate": 1.0785804196332794e-07, "loss": 1.425, "step": 34955 }, { "epoch": 0.95, "learning_rate": 1.0772852141358258e-07, "loss": 1.281, "step": 34956 }, { "epoch": 0.95, "learning_rate": 1.0759907825631966e-07, "loss": 1.3428, "step": 34957 }, { "epoch": 0.95, "learning_rate": 1.0746971249254834e-07, "loss": 1.4062, "step": 34958 }, { "epoch": 0.95, "learning_rate": 1.0734042412328227e-07, "loss": 1.2346, "step": 34959 }, { "epoch": 0.95, "learning_rate": 1.0721121314953398e-07, "loss": 1.1763, "step": 34960 }, { "epoch": 0.95, "learning_rate": 1.0708207957231154e-07, "loss": 1.2, "step": 34961 }, { "epoch": 0.95, "learning_rate": 1.0695302339262858e-07, "loss": 1.3582, "step": 34962 }, { "epoch": 0.95, "learning_rate": 1.068240446114921e-07, "loss": 1.425, "step": 34963 }, { "epoch": 0.95, "learning_rate": 1.0669514322991237e-07, "loss": 1.054, "step": 34964 }, { "epoch": 0.95, "learning_rate": 1.0656631924889749e-07, "loss": 1.2295, "step": 34965 }, { "epoch": 0.95, "learning_rate": 1.0643757266945664e-07, "loss": 1.1262, "step": 34966 }, { "epoch": 0.95, "learning_rate": 1.0630890349259571e-07, "loss": 1.1641, "step": 34967 }, { "epoch": 0.95, "learning_rate": 1.0618031171932053e-07, "loss": 1.127, "step": 34968 }, { "epoch": 0.95, "learning_rate": 1.0605179735063808e-07, "loss": 1.3218, "step": 34969 }, { "epoch": 0.96, "learning_rate": 1.0592336038755536e-07, "loss": 1.2048, "step": 34970 }, { "epoch": 0.96, "learning_rate": 1.0579500083107486e-07, "loss": 1.124, "step": 34971 }, { "epoch": 0.96, "learning_rate": 1.0566671868220247e-07, "loss": 1.3313, "step": 34972 }, { "epoch": 0.96, "learning_rate": 1.055385139419396e-07, "loss": 1.1804, "step": 34973 }, { "epoch": 0.96, "learning_rate": 1.05410386611291e-07, "loss": 1.1396, "step": 34974 }, { "epoch": 0.96, "learning_rate": 1.0528233669126031e-07, "loss": 1.3018, "step": 34975 }, { "epoch": 0.96, "learning_rate": 1.0515436418284564e-07, "loss": 1.7896, "step": 34976 }, { "epoch": 0.96, "learning_rate": 1.0502646908705172e-07, "loss": 1.179, "step": 34977 }, { "epoch": 0.96, "learning_rate": 1.0489865140487776e-07, "loss": 1.3218, "step": 34978 }, { "epoch": 0.96, "learning_rate": 1.0477091113732297e-07, "loss": 1.2161, "step": 34979 }, { "epoch": 0.96, "learning_rate": 1.0464324828538763e-07, "loss": 1.2935, "step": 34980 }, { "epoch": 0.96, "learning_rate": 1.0451566285007098e-07, "loss": 1.0027, "step": 34981 }, { "epoch": 0.96, "learning_rate": 1.0438815483237108e-07, "loss": 1.2217, "step": 34982 }, { "epoch": 0.96, "learning_rate": 1.0426072423328382e-07, "loss": 1.2786, "step": 34983 }, { "epoch": 0.96, "learning_rate": 1.0413337105380727e-07, "loss": 1.1655, "step": 34984 }, { "epoch": 0.96, "learning_rate": 1.0400609529493843e-07, "loss": 1.1819, "step": 34985 }, { "epoch": 0.96, "learning_rate": 1.0387889695767316e-07, "loss": 1.3457, "step": 34986 }, { "epoch": 0.96, "learning_rate": 1.0375177604300513e-07, "loss": 1.2629, "step": 34987 }, { "epoch": 0.96, "learning_rate": 1.0362473255192906e-07, "loss": 1.3118, "step": 34988 }, { "epoch": 0.96, "learning_rate": 1.0349776648543975e-07, "loss": 1.2603, "step": 34989 }, { "epoch": 0.96, "learning_rate": 1.0337087784453192e-07, "loss": 1.3186, "step": 34990 }, { "epoch": 0.96, "learning_rate": 1.0324406663019481e-07, "loss": 1.2917, "step": 34991 }, { "epoch": 0.96, "learning_rate": 1.0311733284342318e-07, "loss": 1.1948, "step": 34992 }, { "epoch": 0.96, "learning_rate": 1.0299067648520622e-07, "loss": 1.2773, "step": 34993 }, { "epoch": 0.96, "learning_rate": 1.028640975565387e-07, "loss": 1.1969, "step": 34994 }, { "epoch": 0.96, "learning_rate": 1.027375960584065e-07, "loss": 1.4507, "step": 34995 }, { "epoch": 0.96, "learning_rate": 1.0261117199180326e-07, "loss": 1.3401, "step": 34996 }, { "epoch": 0.96, "learning_rate": 1.0248482535771376e-07, "loss": 1.1313, "step": 34997 }, { "epoch": 0.96, "learning_rate": 1.0235855615713164e-07, "loss": 1.2529, "step": 34998 }, { "epoch": 0.96, "learning_rate": 1.0223236439103945e-07, "loss": 1.2896, "step": 34999 }, { "epoch": 0.96, "learning_rate": 1.0210625006042862e-07, "loss": 1.0099, "step": 35000 }, { "epoch": 0.96, "learning_rate": 1.0198021316628282e-07, "loss": 1.3, "step": 35001 }, { "epoch": 0.96, "learning_rate": 1.0185425370959012e-07, "loss": 1.1349, "step": 35002 }, { "epoch": 0.96, "learning_rate": 1.0172837169133531e-07, "loss": 1.2349, "step": 35003 }, { "epoch": 0.96, "learning_rate": 1.0160256711250316e-07, "loss": 1.3044, "step": 35004 }, { "epoch": 0.96, "learning_rate": 1.0147683997407843e-07, "loss": 1.2578, "step": 35005 }, { "epoch": 0.96, "learning_rate": 1.0135119027704365e-07, "loss": 1.3643, "step": 35006 }, { "epoch": 0.96, "learning_rate": 1.0122561802238251e-07, "loss": 1.2148, "step": 35007 }, { "epoch": 0.96, "learning_rate": 1.0110012321107753e-07, "loss": 1.2292, "step": 35008 }, { "epoch": 0.96, "learning_rate": 1.0097470584411128e-07, "loss": 1.1663, "step": 35009 }, { "epoch": 0.96, "learning_rate": 1.0084936592246297e-07, "loss": 1.2102, "step": 35010 }, { "epoch": 0.96, "learning_rate": 1.0072410344711514e-07, "loss": 1.0967, "step": 35011 }, { "epoch": 0.96, "learning_rate": 1.0059891841904589e-07, "loss": 1.343, "step": 35012 }, { "epoch": 0.96, "learning_rate": 1.0047381083923669e-07, "loss": 1.3352, "step": 35013 }, { "epoch": 0.96, "learning_rate": 1.003487807086645e-07, "loss": 1.1597, "step": 35014 }, { "epoch": 0.96, "learning_rate": 1.0022382802830854e-07, "loss": 1.3274, "step": 35015 }, { "epoch": 0.96, "learning_rate": 1.0009895279914583e-07, "loss": 1.4961, "step": 35016 }, { "epoch": 0.96, "learning_rate": 9.997415502215446e-08, "loss": 1.3596, "step": 35017 }, { "epoch": 0.96, "learning_rate": 9.984943469831032e-08, "loss": 1.1558, "step": 35018 }, { "epoch": 0.96, "learning_rate": 9.972479182858818e-08, "loss": 1.2288, "step": 35019 }, { "epoch": 0.96, "learning_rate": 9.960022641396283e-08, "loss": 1.2876, "step": 35020 }, { "epoch": 0.96, "learning_rate": 9.947573845541125e-08, "loss": 1.1565, "step": 35021 }, { "epoch": 0.96, "learning_rate": 9.9351327953906e-08, "loss": 1.2107, "step": 35022 }, { "epoch": 0.96, "learning_rate": 9.922699491041965e-08, "loss": 1.2058, "step": 35023 }, { "epoch": 0.96, "learning_rate": 9.910273932592584e-08, "loss": 1.24, "step": 35024 }, { "epoch": 0.96, "learning_rate": 9.897856120139604e-08, "loss": 1.2498, "step": 35025 }, { "epoch": 0.96, "learning_rate": 9.885446053780279e-08, "loss": 1.2427, "step": 35026 }, { "epoch": 0.96, "learning_rate": 9.873043733611642e-08, "loss": 1.3142, "step": 35027 }, { "epoch": 0.96, "learning_rate": 9.860649159730618e-08, "loss": 1.2754, "step": 35028 }, { "epoch": 0.96, "learning_rate": 9.84826233223446e-08, "loss": 1.2649, "step": 35029 }, { "epoch": 0.96, "learning_rate": 9.835883251219758e-08, "loss": 1.3127, "step": 35030 }, { "epoch": 0.96, "learning_rate": 9.823511916783546e-08, "loss": 1.2903, "step": 35031 }, { "epoch": 0.96, "learning_rate": 9.811148329022524e-08, "loss": 1.2046, "step": 35032 }, { "epoch": 0.96, "learning_rate": 9.798792488033393e-08, "loss": 1.2595, "step": 35033 }, { "epoch": 0.96, "learning_rate": 9.786444393913075e-08, "loss": 1.2324, "step": 35034 }, { "epoch": 0.96, "learning_rate": 9.774104046757827e-08, "loss": 1.1077, "step": 35035 }, { "epoch": 0.96, "learning_rate": 9.761771446664348e-08, "loss": 1.2991, "step": 35036 }, { "epoch": 0.96, "learning_rate": 9.749446593729228e-08, "loss": 1.3708, "step": 35037 }, { "epoch": 0.96, "learning_rate": 9.737129488048835e-08, "loss": 1.188, "step": 35038 }, { "epoch": 0.96, "learning_rate": 9.724820129719314e-08, "loss": 1.1365, "step": 35039 }, { "epoch": 0.96, "learning_rate": 9.712518518837254e-08, "loss": 1.1545, "step": 35040 }, { "epoch": 0.96, "learning_rate": 9.700224655498802e-08, "loss": 1.3945, "step": 35041 }, { "epoch": 0.96, "learning_rate": 9.687938539799991e-08, "loss": 1.2732, "step": 35042 }, { "epoch": 0.96, "learning_rate": 9.675660171837186e-08, "loss": 1.3936, "step": 35043 }, { "epoch": 0.96, "learning_rate": 9.663389551706314e-08, "loss": 1.2373, "step": 35044 }, { "epoch": 0.96, "learning_rate": 9.651126679503409e-08, "loss": 1.0713, "step": 35045 }, { "epoch": 0.96, "learning_rate": 9.638871555324391e-08, "loss": 1.1531, "step": 35046 }, { "epoch": 0.96, "learning_rate": 9.626624179265076e-08, "loss": 1.1008, "step": 35047 }, { "epoch": 0.96, "learning_rate": 9.614384551421385e-08, "loss": 1.2991, "step": 35048 }, { "epoch": 0.96, "learning_rate": 9.60215267188902e-08, "loss": 1.2634, "step": 35049 }, { "epoch": 0.96, "learning_rate": 9.589928540763682e-08, "loss": 1.2954, "step": 35050 }, { "epoch": 0.96, "learning_rate": 9.577712158141072e-08, "loss": 1.1965, "step": 35051 }, { "epoch": 0.96, "learning_rate": 9.56550352411667e-08, "loss": 1.176, "step": 35052 }, { "epoch": 0.96, "learning_rate": 9.553302638786066e-08, "loss": 1.2427, "step": 35053 }, { "epoch": 0.96, "learning_rate": 9.541109502244739e-08, "loss": 1.3025, "step": 35054 }, { "epoch": 0.96, "learning_rate": 9.528924114587834e-08, "loss": 1.2842, "step": 35055 }, { "epoch": 0.96, "learning_rate": 9.516746475911054e-08, "loss": 1.3599, "step": 35056 }, { "epoch": 0.96, "learning_rate": 9.504576586309433e-08, "loss": 1.3989, "step": 35057 }, { "epoch": 0.96, "learning_rate": 9.49241444587834e-08, "loss": 1.2588, "step": 35058 }, { "epoch": 0.96, "learning_rate": 9.480260054712587e-08, "loss": 1.2014, "step": 35059 }, { "epoch": 0.96, "learning_rate": 9.468113412907764e-08, "loss": 1.4856, "step": 35060 }, { "epoch": 0.96, "learning_rate": 9.455974520558465e-08, "loss": 1.1272, "step": 35061 }, { "epoch": 0.96, "learning_rate": 9.443843377759943e-08, "loss": 1.1064, "step": 35062 }, { "epoch": 0.96, "learning_rate": 9.431719984606901e-08, "loss": 1.2424, "step": 35063 }, { "epoch": 0.96, "learning_rate": 9.419604341194377e-08, "loss": 1.3169, "step": 35064 }, { "epoch": 0.96, "learning_rate": 9.407496447616959e-08, "loss": 1.2681, "step": 35065 }, { "epoch": 0.96, "learning_rate": 9.395396303969573e-08, "loss": 1.1755, "step": 35066 }, { "epoch": 0.96, "learning_rate": 9.383303910346697e-08, "loss": 1.4111, "step": 35067 }, { "epoch": 0.96, "learning_rate": 9.371219266843145e-08, "loss": 1.4048, "step": 35068 }, { "epoch": 0.96, "learning_rate": 9.359142373553287e-08, "loss": 1.1919, "step": 35069 }, { "epoch": 0.96, "learning_rate": 9.347073230571712e-08, "loss": 1.2239, "step": 35070 }, { "epoch": 0.96, "learning_rate": 9.33501183799268e-08, "loss": 1.2781, "step": 35071 }, { "epoch": 0.96, "learning_rate": 9.32295819591078e-08, "loss": 1.2463, "step": 35072 }, { "epoch": 0.96, "learning_rate": 9.310912304420272e-08, "loss": 1.2529, "step": 35073 }, { "epoch": 0.96, "learning_rate": 9.29887416361519e-08, "loss": 1.092, "step": 35074 }, { "epoch": 0.96, "learning_rate": 9.286843773589904e-08, "loss": 1.2563, "step": 35075 }, { "epoch": 0.96, "learning_rate": 9.27482113443845e-08, "loss": 1.2817, "step": 35076 }, { "epoch": 0.96, "learning_rate": 9.262806246254974e-08, "loss": 1.2493, "step": 35077 }, { "epoch": 0.96, "learning_rate": 9.250799109133402e-08, "loss": 1.2197, "step": 35078 }, { "epoch": 0.96, "learning_rate": 9.238799723167657e-08, "loss": 1.2393, "step": 35079 }, { "epoch": 0.96, "learning_rate": 9.226808088451666e-08, "loss": 1.2903, "step": 35080 }, { "epoch": 0.96, "learning_rate": 9.214824205079354e-08, "loss": 1.2168, "step": 35081 }, { "epoch": 0.96, "learning_rate": 9.20284807314431e-08, "loss": 1.6792, "step": 35082 }, { "epoch": 0.96, "learning_rate": 9.190879692740129e-08, "loss": 1.3198, "step": 35083 }, { "epoch": 0.96, "learning_rate": 9.178919063960734e-08, "loss": 1.1121, "step": 35084 }, { "epoch": 0.96, "learning_rate": 9.166966186899495e-08, "loss": 1.157, "step": 35085 }, { "epoch": 0.96, "learning_rate": 9.155021061650115e-08, "loss": 1.3645, "step": 35086 }, { "epoch": 0.96, "learning_rate": 9.143083688305742e-08, "loss": 1.3606, "step": 35087 }, { "epoch": 0.96, "learning_rate": 9.131154066960079e-08, "loss": 1.1279, "step": 35088 }, { "epoch": 0.96, "learning_rate": 9.119232197706274e-08, "loss": 1.0869, "step": 35089 }, { "epoch": 0.96, "learning_rate": 9.107318080637694e-08, "loss": 1.3237, "step": 35090 }, { "epoch": 0.96, "learning_rate": 9.095411715847491e-08, "loss": 1.283, "step": 35091 }, { "epoch": 0.96, "learning_rate": 9.08351310342881e-08, "loss": 1.25, "step": 35092 }, { "epoch": 0.96, "learning_rate": 9.071622243474799e-08, "loss": 1.1843, "step": 35093 }, { "epoch": 0.96, "learning_rate": 9.059739136078383e-08, "loss": 1.2986, "step": 35094 }, { "epoch": 0.96, "learning_rate": 9.047863781332599e-08, "loss": 1.3877, "step": 35095 }, { "epoch": 0.96, "learning_rate": 9.035996179330376e-08, "loss": 1.2419, "step": 35096 }, { "epoch": 0.96, "learning_rate": 9.024136330164524e-08, "loss": 1.2864, "step": 35097 }, { "epoch": 0.96, "learning_rate": 9.01228423392786e-08, "loss": 1.1641, "step": 35098 }, { "epoch": 0.96, "learning_rate": 9.000439890713087e-08, "loss": 1.3037, "step": 35099 }, { "epoch": 0.96, "learning_rate": 8.988603300612908e-08, "loss": 1.3171, "step": 35100 }, { "epoch": 0.96, "learning_rate": 8.976774463719806e-08, "loss": 1.2815, "step": 35101 }, { "epoch": 0.96, "learning_rate": 8.964953380126484e-08, "loss": 1.2358, "step": 35102 }, { "epoch": 0.96, "learning_rate": 8.953140049925314e-08, "loss": 1.251, "step": 35103 }, { "epoch": 0.96, "learning_rate": 8.941334473208774e-08, "loss": 1.3125, "step": 35104 }, { "epoch": 0.96, "learning_rate": 8.929536650069237e-08, "loss": 1.7256, "step": 35105 }, { "epoch": 0.96, "learning_rate": 8.917746580598852e-08, "loss": 1.3613, "step": 35106 }, { "epoch": 0.96, "learning_rate": 8.905964264890099e-08, "loss": 1.3167, "step": 35107 }, { "epoch": 0.96, "learning_rate": 8.894189703034906e-08, "loss": 1.196, "step": 35108 }, { "epoch": 0.96, "learning_rate": 8.882422895125642e-08, "loss": 1.2219, "step": 35109 }, { "epoch": 0.96, "learning_rate": 8.870663841254234e-08, "loss": 1.1848, "step": 35110 }, { "epoch": 0.96, "learning_rate": 8.85891254151261e-08, "loss": 1.3206, "step": 35111 }, { "epoch": 0.96, "learning_rate": 8.847168995992916e-08, "loss": 1.3081, "step": 35112 }, { "epoch": 0.96, "learning_rate": 8.835433204786747e-08, "loss": 1.1753, "step": 35113 }, { "epoch": 0.96, "learning_rate": 8.823705167986141e-08, "loss": 1.1112, "step": 35114 }, { "epoch": 0.96, "learning_rate": 8.8119848856828e-08, "loss": 1.1765, "step": 35115 }, { "epoch": 0.96, "learning_rate": 8.800272357968431e-08, "loss": 1.2581, "step": 35116 }, { "epoch": 0.96, "learning_rate": 8.788567584934516e-08, "loss": 1.2295, "step": 35117 }, { "epoch": 0.96, "learning_rate": 8.776870566672868e-08, "loss": 1.0944, "step": 35118 }, { "epoch": 0.96, "learning_rate": 8.76518130327475e-08, "loss": 1.405, "step": 35119 }, { "epoch": 0.96, "learning_rate": 8.753499794831977e-08, "loss": 1.3521, "step": 35120 }, { "epoch": 0.96, "learning_rate": 8.741826041435475e-08, "loss": 1.2148, "step": 35121 }, { "epoch": 0.96, "learning_rate": 8.730160043176839e-08, "loss": 1.2214, "step": 35122 }, { "epoch": 0.96, "learning_rate": 8.718501800147328e-08, "loss": 1.4116, "step": 35123 }, { "epoch": 0.96, "learning_rate": 8.706851312438203e-08, "loss": 1.1228, "step": 35124 }, { "epoch": 0.96, "learning_rate": 8.695208580140502e-08, "loss": 1.165, "step": 35125 }, { "epoch": 0.96, "learning_rate": 8.683573603345263e-08, "loss": 1.2791, "step": 35126 }, { "epoch": 0.96, "learning_rate": 8.671946382143636e-08, "loss": 1.2678, "step": 35127 }, { "epoch": 0.96, "learning_rate": 8.66032691662666e-08, "loss": 1.1909, "step": 35128 }, { "epoch": 0.96, "learning_rate": 8.648715206884928e-08, "loss": 1.2717, "step": 35129 }, { "epoch": 0.96, "learning_rate": 8.637111253009589e-08, "loss": 1.0967, "step": 35130 }, { "epoch": 0.96, "learning_rate": 8.625515055091349e-08, "loss": 1.1917, "step": 35131 }, { "epoch": 0.96, "learning_rate": 8.613926613220803e-08, "loss": 1.3291, "step": 35132 }, { "epoch": 0.96, "learning_rate": 8.602345927488764e-08, "loss": 1.2207, "step": 35133 }, { "epoch": 0.96, "learning_rate": 8.59077299798583e-08, "loss": 1.2751, "step": 35134 }, { "epoch": 0.96, "learning_rate": 8.579207824802482e-08, "loss": 1.2212, "step": 35135 }, { "epoch": 0.96, "learning_rate": 8.567650408029205e-08, "loss": 1.0862, "step": 35136 }, { "epoch": 0.96, "learning_rate": 8.556100747756368e-08, "loss": 1.2576, "step": 35137 }, { "epoch": 0.96, "learning_rate": 8.544558844074347e-08, "loss": 1.28, "step": 35138 }, { "epoch": 0.96, "learning_rate": 8.533024697073622e-08, "loss": 1.2556, "step": 35139 }, { "epoch": 0.96, "learning_rate": 8.521498306844233e-08, "loss": 1.1536, "step": 35140 }, { "epoch": 0.96, "learning_rate": 8.509979673476442e-08, "loss": 1.196, "step": 35141 }, { "epoch": 0.96, "learning_rate": 8.498468797060288e-08, "loss": 1.1802, "step": 35142 }, { "epoch": 0.96, "learning_rate": 8.486965677685921e-08, "loss": 1.1855, "step": 35143 }, { "epoch": 0.96, "learning_rate": 8.475470315443268e-08, "loss": 1.3318, "step": 35144 }, { "epoch": 0.96, "learning_rate": 8.463982710422258e-08, "loss": 1.2034, "step": 35145 }, { "epoch": 0.96, "learning_rate": 8.452502862712819e-08, "loss": 1.2622, "step": 35146 }, { "epoch": 0.96, "learning_rate": 8.441030772404768e-08, "loss": 1.3181, "step": 35147 }, { "epoch": 0.96, "learning_rate": 8.429566439587811e-08, "loss": 1.2915, "step": 35148 }, { "epoch": 0.96, "learning_rate": 8.418109864351653e-08, "loss": 1.3843, "step": 35149 }, { "epoch": 0.96, "learning_rate": 8.406661046786002e-08, "loss": 1.2344, "step": 35150 }, { "epoch": 0.96, "learning_rate": 8.39521998698023e-08, "loss": 1.2366, "step": 35151 }, { "epoch": 0.96, "learning_rate": 8.383786685024043e-08, "loss": 1.3398, "step": 35152 }, { "epoch": 0.96, "learning_rate": 8.372361141006813e-08, "loss": 1.3328, "step": 35153 }, { "epoch": 0.96, "learning_rate": 8.360943355017915e-08, "loss": 1.1079, "step": 35154 }, { "epoch": 0.96, "learning_rate": 8.349533327146719e-08, "loss": 1.2727, "step": 35155 }, { "epoch": 0.96, "learning_rate": 8.33813105748249e-08, "loss": 1.186, "step": 35156 }, { "epoch": 0.96, "learning_rate": 8.326736546114267e-08, "loss": 1.1477, "step": 35157 }, { "epoch": 0.96, "learning_rate": 8.315349793131421e-08, "loss": 1.3066, "step": 35158 }, { "epoch": 0.96, "learning_rate": 8.303970798622995e-08, "loss": 1.312, "step": 35159 }, { "epoch": 0.96, "learning_rate": 8.292599562677916e-08, "loss": 1.177, "step": 35160 }, { "epoch": 0.96, "learning_rate": 8.281236085385336e-08, "loss": 1.3274, "step": 35161 }, { "epoch": 0.96, "learning_rate": 8.269880366833849e-08, "loss": 1.2166, "step": 35162 }, { "epoch": 0.96, "learning_rate": 8.258532407112608e-08, "loss": 1.1616, "step": 35163 }, { "epoch": 0.96, "learning_rate": 8.247192206310206e-08, "loss": 1.2192, "step": 35164 }, { "epoch": 0.96, "learning_rate": 8.235859764515463e-08, "loss": 1.2773, "step": 35165 }, { "epoch": 0.96, "learning_rate": 8.224535081816865e-08, "loss": 1.2856, "step": 35166 }, { "epoch": 0.96, "learning_rate": 8.213218158303338e-08, "loss": 1.0425, "step": 35167 }, { "epoch": 0.96, "learning_rate": 8.201908994063035e-08, "loss": 1.241, "step": 35168 }, { "epoch": 0.96, "learning_rate": 8.190607589184774e-08, "loss": 1.4258, "step": 35169 }, { "epoch": 0.96, "learning_rate": 8.179313943756705e-08, "loss": 1.1421, "step": 35170 }, { "epoch": 0.96, "learning_rate": 8.168028057867316e-08, "loss": 1.3074, "step": 35171 }, { "epoch": 0.96, "learning_rate": 8.156749931604868e-08, "loss": 1.2778, "step": 35172 }, { "epoch": 0.96, "learning_rate": 8.145479565057735e-08, "loss": 1.2183, "step": 35173 }, { "epoch": 0.96, "learning_rate": 8.134216958313734e-08, "loss": 1.282, "step": 35174 }, { "epoch": 0.96, "learning_rate": 8.122962111461352e-08, "loss": 1.3628, "step": 35175 }, { "epoch": 0.96, "learning_rate": 8.111715024588518e-08, "loss": 1.3245, "step": 35176 }, { "epoch": 0.96, "learning_rate": 8.100475697783161e-08, "loss": 1.2444, "step": 35177 }, { "epoch": 0.96, "learning_rate": 8.089244131133323e-08, "loss": 1.2507, "step": 35178 }, { "epoch": 0.96, "learning_rate": 8.078020324726821e-08, "loss": 1.3108, "step": 35179 }, { "epoch": 0.96, "learning_rate": 8.066804278651363e-08, "loss": 1.3184, "step": 35180 }, { "epoch": 0.96, "learning_rate": 8.055595992994769e-08, "loss": 1.2908, "step": 35181 }, { "epoch": 0.96, "learning_rate": 8.044395467844857e-08, "loss": 1.2205, "step": 35182 }, { "epoch": 0.96, "learning_rate": 8.033202703289111e-08, "loss": 1.2778, "step": 35183 }, { "epoch": 0.96, "learning_rate": 8.02201769941513e-08, "loss": 1.2087, "step": 35184 }, { "epoch": 0.96, "learning_rate": 8.010840456310398e-08, "loss": 1.2178, "step": 35185 }, { "epoch": 0.96, "learning_rate": 7.999670974062401e-08, "loss": 1.1997, "step": 35186 }, { "epoch": 0.96, "learning_rate": 7.988509252758514e-08, "loss": 1.1681, "step": 35187 }, { "epoch": 0.96, "learning_rate": 7.977355292486e-08, "loss": 1.333, "step": 35188 }, { "epoch": 0.96, "learning_rate": 7.966209093332234e-08, "loss": 1.2913, "step": 35189 }, { "epoch": 0.96, "learning_rate": 7.955070655384368e-08, "loss": 1.1472, "step": 35190 }, { "epoch": 0.96, "learning_rate": 7.943939978729553e-08, "loss": 1.3159, "step": 35191 }, { "epoch": 0.96, "learning_rate": 7.932817063454723e-08, "loss": 1.3535, "step": 35192 }, { "epoch": 0.96, "learning_rate": 7.921701909647139e-08, "loss": 1.1832, "step": 35193 }, { "epoch": 0.96, "learning_rate": 7.910594517393621e-08, "loss": 1.2197, "step": 35194 }, { "epoch": 0.96, "learning_rate": 7.8994948867811e-08, "loss": 1.2615, "step": 35195 }, { "epoch": 0.96, "learning_rate": 7.888403017896395e-08, "loss": 1.2422, "step": 35196 }, { "epoch": 0.96, "learning_rate": 7.877318910826326e-08, "loss": 1.2444, "step": 35197 }, { "epoch": 0.96, "learning_rate": 7.8662425656576e-08, "loss": 1.4438, "step": 35198 }, { "epoch": 0.96, "learning_rate": 7.855173982476926e-08, "loss": 1.3997, "step": 35199 }, { "epoch": 0.96, "learning_rate": 7.844113161370681e-08, "loss": 1.2512, "step": 35200 }, { "epoch": 0.96, "learning_rate": 7.833060102425682e-08, "loss": 1.2834, "step": 35201 }, { "epoch": 0.96, "learning_rate": 7.822014805728196e-08, "loss": 1.3235, "step": 35202 }, { "epoch": 0.96, "learning_rate": 7.810977271364705e-08, "loss": 1.1897, "step": 35203 }, { "epoch": 0.96, "learning_rate": 7.79994749942159e-08, "loss": 1.3315, "step": 35204 }, { "epoch": 0.96, "learning_rate": 7.78892548998511e-08, "loss": 1.4067, "step": 35205 }, { "epoch": 0.96, "learning_rate": 7.777911243141534e-08, "loss": 1.3394, "step": 35206 }, { "epoch": 0.96, "learning_rate": 7.766904758976901e-08, "loss": 1.324, "step": 35207 }, { "epoch": 0.96, "learning_rate": 7.755906037577588e-08, "loss": 1.283, "step": 35208 }, { "epoch": 0.96, "learning_rate": 7.744915079029302e-08, "loss": 1.2119, "step": 35209 }, { "epoch": 0.96, "learning_rate": 7.733931883418422e-08, "loss": 1.3726, "step": 35210 }, { "epoch": 0.96, "learning_rate": 7.722956450830543e-08, "loss": 1.175, "step": 35211 }, { "epoch": 0.96, "learning_rate": 7.711988781351598e-08, "loss": 1.3462, "step": 35212 }, { "epoch": 0.96, "learning_rate": 7.701028875067518e-08, "loss": 1.0955, "step": 35213 }, { "epoch": 0.96, "learning_rate": 7.690076732064011e-08, "loss": 1.2734, "step": 35214 }, { "epoch": 0.96, "learning_rate": 7.679132352426676e-08, "loss": 1.2588, "step": 35215 }, { "epoch": 0.96, "learning_rate": 7.668195736241113e-08, "loss": 1.3101, "step": 35216 }, { "epoch": 0.96, "learning_rate": 7.657266883593028e-08, "loss": 1.365, "step": 35217 }, { "epoch": 0.96, "learning_rate": 7.646345794567911e-08, "loss": 1.3975, "step": 35218 }, { "epoch": 0.96, "learning_rate": 7.635432469251137e-08, "loss": 1.2109, "step": 35219 }, { "epoch": 0.96, "learning_rate": 7.624526907727969e-08, "loss": 1.2419, "step": 35220 }, { "epoch": 0.96, "learning_rate": 7.613629110084009e-08, "loss": 1.3796, "step": 35221 }, { "epoch": 0.96, "learning_rate": 7.602739076404297e-08, "loss": 1.3362, "step": 35222 }, { "epoch": 0.96, "learning_rate": 7.591856806774101e-08, "loss": 1.2114, "step": 35223 }, { "epoch": 0.96, "learning_rate": 7.580982301278461e-08, "loss": 1.4045, "step": 35224 }, { "epoch": 0.96, "learning_rate": 7.570115560002644e-08, "loss": 1.1331, "step": 35225 }, { "epoch": 0.96, "learning_rate": 7.559256583031582e-08, "loss": 1.199, "step": 35226 }, { "epoch": 0.96, "learning_rate": 7.548405370450207e-08, "loss": 1.3472, "step": 35227 }, { "epoch": 0.96, "learning_rate": 7.53756192234345e-08, "loss": 1.3069, "step": 35228 }, { "epoch": 0.96, "learning_rate": 7.526726238796023e-08, "loss": 1.2476, "step": 35229 }, { "epoch": 0.96, "learning_rate": 7.515898319892856e-08, "loss": 1.2449, "step": 35230 }, { "epoch": 0.96, "learning_rate": 7.50507816571866e-08, "loss": 1.3774, "step": 35231 }, { "epoch": 0.96, "learning_rate": 7.494265776357924e-08, "loss": 1.2637, "step": 35232 }, { "epoch": 0.96, "learning_rate": 7.483461151895465e-08, "loss": 1.2917, "step": 35233 }, { "epoch": 0.96, "learning_rate": 7.472664292415555e-08, "loss": 1.2864, "step": 35234 }, { "epoch": 0.96, "learning_rate": 7.461875198002899e-08, "loss": 1.2976, "step": 35235 }, { "epoch": 0.96, "learning_rate": 7.451093868741766e-08, "loss": 1.3496, "step": 35236 }, { "epoch": 0.96, "learning_rate": 7.440320304716531e-08, "loss": 1.4817, "step": 35237 }, { "epoch": 0.96, "learning_rate": 7.429554506011571e-08, "loss": 1.3025, "step": 35238 }, { "epoch": 0.96, "learning_rate": 7.418796472710931e-08, "loss": 1.2971, "step": 35239 }, { "epoch": 0.96, "learning_rate": 7.408046204898878e-08, "loss": 1.2678, "step": 35240 }, { "epoch": 0.96, "learning_rate": 7.397303702659675e-08, "loss": 1.1362, "step": 35241 }, { "epoch": 0.96, "learning_rate": 7.386568966077145e-08, "loss": 1.4087, "step": 35242 }, { "epoch": 0.96, "learning_rate": 7.375841995235222e-08, "loss": 1.1744, "step": 35243 }, { "epoch": 0.96, "learning_rate": 7.36512279021806e-08, "loss": 1.2122, "step": 35244 }, { "epoch": 0.96, "learning_rate": 7.35441135110937e-08, "loss": 1.1321, "step": 35245 }, { "epoch": 0.96, "learning_rate": 7.343707677993083e-08, "loss": 1.2329, "step": 35246 }, { "epoch": 0.96, "learning_rate": 7.333011770952691e-08, "loss": 1.3188, "step": 35247 }, { "epoch": 0.96, "learning_rate": 7.322323630072126e-08, "loss": 1.1914, "step": 35248 }, { "epoch": 0.96, "learning_rate": 7.311643255434874e-08, "loss": 1.3103, "step": 35249 }, { "epoch": 0.96, "learning_rate": 7.300970647124539e-08, "loss": 1.3618, "step": 35250 }, { "epoch": 0.96, "learning_rate": 7.290305805224606e-08, "loss": 1.2507, "step": 35251 }, { "epoch": 0.96, "learning_rate": 7.279648729818567e-08, "loss": 1.1196, "step": 35252 }, { "epoch": 0.96, "learning_rate": 7.268999420989686e-08, "loss": 1.3911, "step": 35253 }, { "epoch": 0.96, "learning_rate": 7.258357878821343e-08, "loss": 1.3823, "step": 35254 }, { "epoch": 0.96, "learning_rate": 7.247724103396803e-08, "loss": 1.2866, "step": 35255 }, { "epoch": 0.96, "learning_rate": 7.237098094799222e-08, "loss": 1.2498, "step": 35256 }, { "epoch": 0.96, "learning_rate": 7.226479853111867e-08, "loss": 1.4163, "step": 35257 }, { "epoch": 0.96, "learning_rate": 7.215869378417561e-08, "loss": 1.3464, "step": 35258 }, { "epoch": 0.96, "learning_rate": 7.205266670799571e-08, "loss": 1.3081, "step": 35259 }, { "epoch": 0.96, "learning_rate": 7.194671730340607e-08, "loss": 1.3015, "step": 35260 }, { "epoch": 0.96, "learning_rate": 7.184084557123827e-08, "loss": 1.2224, "step": 35261 }, { "epoch": 0.96, "learning_rate": 7.173505151231718e-08, "loss": 1.3198, "step": 35262 }, { "epoch": 0.96, "learning_rate": 7.162933512747439e-08, "loss": 1.3616, "step": 35263 }, { "epoch": 0.96, "learning_rate": 7.152369641753365e-08, "loss": 1.3076, "step": 35264 }, { "epoch": 0.96, "learning_rate": 7.141813538332321e-08, "loss": 1.2253, "step": 35265 }, { "epoch": 0.96, "learning_rate": 7.131265202566906e-08, "loss": 1.4834, "step": 35266 }, { "epoch": 0.96, "learning_rate": 7.1207246345395e-08, "loss": 1.342, "step": 35267 }, { "epoch": 0.96, "learning_rate": 7.110191834332702e-08, "loss": 1.2244, "step": 35268 }, { "epoch": 0.96, "learning_rate": 7.099666802028892e-08, "loss": 1.249, "step": 35269 }, { "epoch": 0.96, "learning_rate": 7.089149537710449e-08, "loss": 1.1597, "step": 35270 }, { "epoch": 0.96, "learning_rate": 7.078640041459416e-08, "loss": 1.2952, "step": 35271 }, { "epoch": 0.96, "learning_rate": 7.068138313358397e-08, "loss": 1.2556, "step": 35272 }, { "epoch": 0.96, "learning_rate": 7.057644353489212e-08, "loss": 1.3064, "step": 35273 }, { "epoch": 0.96, "learning_rate": 7.047158161934242e-08, "loss": 1.2207, "step": 35274 }, { "epoch": 0.96, "learning_rate": 7.036679738775309e-08, "loss": 1.1335, "step": 35275 }, { "epoch": 0.96, "learning_rate": 7.02620908409446e-08, "loss": 1.4062, "step": 35276 }, { "epoch": 0.96, "learning_rate": 7.015746197973628e-08, "loss": 1.3621, "step": 35277 }, { "epoch": 0.96, "learning_rate": 7.005291080494747e-08, "loss": 1.2727, "step": 35278 }, { "epoch": 0.96, "learning_rate": 6.994843731739309e-08, "loss": 1.252, "step": 35279 }, { "epoch": 0.96, "learning_rate": 6.98440415178947e-08, "loss": 1.0876, "step": 35280 }, { "epoch": 0.96, "learning_rate": 6.973972340726721e-08, "loss": 1.1206, "step": 35281 }, { "epoch": 0.96, "learning_rate": 6.963548298632549e-08, "loss": 1.2942, "step": 35282 }, { "epoch": 0.96, "learning_rate": 6.953132025588672e-08, "loss": 1.3635, "step": 35283 }, { "epoch": 0.96, "learning_rate": 6.942723521676465e-08, "loss": 1.2913, "step": 35284 }, { "epoch": 0.96, "learning_rate": 6.93232278697753e-08, "loss": 1.1146, "step": 35285 }, { "epoch": 0.96, "learning_rate": 6.921929821573025e-08, "loss": 1.323, "step": 35286 }, { "epoch": 0.96, "learning_rate": 6.911544625544331e-08, "loss": 1.3491, "step": 35287 }, { "epoch": 0.96, "learning_rate": 6.901167198972824e-08, "loss": 1.2092, "step": 35288 }, { "epoch": 0.96, "learning_rate": 6.890797541939665e-08, "loss": 1.2003, "step": 35289 }, { "epoch": 0.96, "learning_rate": 6.880435654525785e-08, "loss": 1.2463, "step": 35290 }, { "epoch": 0.96, "learning_rate": 6.870081536812345e-08, "loss": 1.1863, "step": 35291 }, { "epoch": 0.96, "learning_rate": 6.8597351888805e-08, "loss": 1.2622, "step": 35292 }, { "epoch": 0.96, "learning_rate": 6.849396610811076e-08, "loss": 1.1899, "step": 35293 }, { "epoch": 0.96, "learning_rate": 6.839065802684897e-08, "loss": 1.229, "step": 35294 }, { "epoch": 0.96, "learning_rate": 6.828742764582785e-08, "loss": 1.3433, "step": 35295 }, { "epoch": 0.96, "learning_rate": 6.818427496585678e-08, "loss": 1.394, "step": 35296 }, { "epoch": 0.96, "learning_rate": 6.808119998774176e-08, "loss": 1.1943, "step": 35297 }, { "epoch": 0.96, "learning_rate": 6.797820271228883e-08, "loss": 1.2856, "step": 35298 }, { "epoch": 0.96, "learning_rate": 6.7875283140304e-08, "loss": 1.2651, "step": 35299 }, { "epoch": 0.96, "learning_rate": 6.777244127259219e-08, "loss": 1.2944, "step": 35300 }, { "epoch": 0.96, "learning_rate": 6.766967710995831e-08, "loss": 1.4246, "step": 35301 }, { "epoch": 0.96, "learning_rate": 6.756699065320726e-08, "loss": 1.2515, "step": 35302 }, { "epoch": 0.96, "learning_rate": 6.746438190314064e-08, "loss": 1.2432, "step": 35303 }, { "epoch": 0.96, "learning_rate": 6.736185086056335e-08, "loss": 1.6724, "step": 35304 }, { "epoch": 0.96, "learning_rate": 6.725939752627476e-08, "loss": 1.2498, "step": 35305 }, { "epoch": 0.96, "learning_rate": 6.715702190107865e-08, "loss": 1.3088, "step": 35306 }, { "epoch": 0.96, "learning_rate": 6.70547239857755e-08, "loss": 1.2463, "step": 35307 }, { "epoch": 0.96, "learning_rate": 6.695250378116469e-08, "loss": 1.2874, "step": 35308 }, { "epoch": 0.96, "learning_rate": 6.685036128804779e-08, "loss": 1.1714, "step": 35309 }, { "epoch": 0.96, "learning_rate": 6.674829650722192e-08, "loss": 1.209, "step": 35310 }, { "epoch": 0.96, "learning_rate": 6.664630943948647e-08, "loss": 1.3325, "step": 35311 }, { "epoch": 0.96, "learning_rate": 6.654440008563856e-08, "loss": 1.3115, "step": 35312 }, { "epoch": 0.96, "learning_rate": 6.644256844647757e-08, "loss": 1.3269, "step": 35313 }, { "epoch": 0.96, "learning_rate": 6.63408145227984e-08, "loss": 1.1188, "step": 35314 }, { "epoch": 0.96, "learning_rate": 6.623913831539707e-08, "loss": 1.177, "step": 35315 }, { "epoch": 0.96, "learning_rate": 6.613753982506965e-08, "loss": 1.3423, "step": 35316 }, { "epoch": 0.96, "learning_rate": 6.603601905261214e-08, "loss": 1.3184, "step": 35317 }, { "epoch": 0.96, "learning_rate": 6.593457599881614e-08, "loss": 1.7383, "step": 35318 }, { "epoch": 0.96, "learning_rate": 6.583321066447657e-08, "loss": 1.4858, "step": 35319 }, { "epoch": 0.96, "learning_rate": 6.573192305038723e-08, "loss": 1.4153, "step": 35320 }, { "epoch": 0.96, "learning_rate": 6.563071315734082e-08, "loss": 1.3506, "step": 35321 }, { "epoch": 0.96, "learning_rate": 6.552958098612672e-08, "loss": 1.1001, "step": 35322 }, { "epoch": 0.96, "learning_rate": 6.542852653753761e-08, "loss": 1.386, "step": 35323 }, { "epoch": 0.96, "learning_rate": 6.532754981236511e-08, "loss": 1.3074, "step": 35324 }, { "epoch": 0.96, "learning_rate": 6.522665081139856e-08, "loss": 1.396, "step": 35325 }, { "epoch": 0.96, "learning_rate": 6.512582953542513e-08, "loss": 1.2141, "step": 35326 }, { "epoch": 0.96, "learning_rate": 6.50250859852375e-08, "loss": 1.4526, "step": 35327 }, { "epoch": 0.96, "learning_rate": 6.492442016162059e-08, "loss": 1.3335, "step": 35328 }, { "epoch": 0.96, "learning_rate": 6.48238320653638e-08, "loss": 1.208, "step": 35329 }, { "epoch": 0.96, "learning_rate": 6.472332169725315e-08, "loss": 1.166, "step": 35330 }, { "epoch": 0.96, "learning_rate": 6.462288905807579e-08, "loss": 1.3315, "step": 35331 }, { "epoch": 0.96, "learning_rate": 6.452253414861665e-08, "loss": 1.3555, "step": 35332 }, { "epoch": 0.96, "learning_rate": 6.442225696966175e-08, "loss": 1.3137, "step": 35333 }, { "epoch": 0.96, "learning_rate": 6.432205752199383e-08, "loss": 1.218, "step": 35334 }, { "epoch": 0.96, "learning_rate": 6.42219358063989e-08, "loss": 1.2107, "step": 35335 }, { "epoch": 0.97, "learning_rate": 6.41218918236597e-08, "loss": 1.3174, "step": 35336 }, { "epoch": 0.97, "learning_rate": 6.402192557455777e-08, "loss": 1.2566, "step": 35337 }, { "epoch": 0.97, "learning_rate": 6.392203705987698e-08, "loss": 1.103, "step": 35338 }, { "epoch": 0.97, "learning_rate": 6.38222262803978e-08, "loss": 1.187, "step": 35339 }, { "epoch": 0.97, "learning_rate": 6.372249323690072e-08, "loss": 1.2024, "step": 35340 }, { "epoch": 0.97, "learning_rate": 6.362283793016733e-08, "loss": 1.2703, "step": 35341 }, { "epoch": 0.97, "learning_rate": 6.35232603609759e-08, "loss": 1.3352, "step": 35342 }, { "epoch": 0.97, "learning_rate": 6.342376053010468e-08, "loss": 1.3474, "step": 35343 }, { "epoch": 0.97, "learning_rate": 6.33243384383353e-08, "loss": 1.2854, "step": 35344 }, { "epoch": 0.97, "learning_rate": 6.322499408644378e-08, "loss": 1.1858, "step": 35345 }, { "epoch": 0.97, "learning_rate": 6.312572747520618e-08, "loss": 1.2278, "step": 35346 }, { "epoch": 0.97, "learning_rate": 6.302653860540075e-08, "loss": 1.1194, "step": 35347 }, { "epoch": 0.97, "learning_rate": 6.292742747780245e-08, "loss": 1.321, "step": 35348 }, { "epoch": 0.97, "learning_rate": 6.282839409318842e-08, "loss": 1.2634, "step": 35349 }, { "epoch": 0.97, "learning_rate": 6.272943845233138e-08, "loss": 1.1526, "step": 35350 }, { "epoch": 0.97, "learning_rate": 6.263056055600625e-08, "loss": 1.3931, "step": 35351 }, { "epoch": 0.97, "learning_rate": 6.253176040498687e-08, "loss": 1.2349, "step": 35352 }, { "epoch": 0.97, "learning_rate": 6.243303800004707e-08, "loss": 1.2776, "step": 35353 }, { "epoch": 0.97, "learning_rate": 6.233439334195734e-08, "loss": 1.2317, "step": 35354 }, { "epoch": 0.97, "learning_rate": 6.22358264314904e-08, "loss": 1.384, "step": 35355 }, { "epoch": 0.97, "learning_rate": 6.213733726941674e-08, "loss": 1.2383, "step": 35356 }, { "epoch": 0.97, "learning_rate": 6.203892585650795e-08, "loss": 1.3594, "step": 35357 }, { "epoch": 0.97, "learning_rate": 6.194059219353344e-08, "loss": 1.1963, "step": 35358 }, { "epoch": 0.97, "learning_rate": 6.184233628126258e-08, "loss": 1.3853, "step": 35359 }, { "epoch": 0.97, "learning_rate": 6.174415812046475e-08, "loss": 1.3826, "step": 35360 }, { "epoch": 0.97, "learning_rate": 6.164605771190601e-08, "loss": 1.332, "step": 35361 }, { "epoch": 0.97, "learning_rate": 6.154803505635576e-08, "loss": 1.0935, "step": 35362 }, { "epoch": 0.97, "learning_rate": 6.145009015458004e-08, "loss": 1.4155, "step": 35363 }, { "epoch": 0.97, "learning_rate": 6.1352223007346e-08, "loss": 1.0587, "step": 35364 }, { "epoch": 0.97, "learning_rate": 6.12544336154175e-08, "loss": 1.3938, "step": 35365 }, { "epoch": 0.97, "learning_rate": 6.115672197956168e-08, "loss": 1.1931, "step": 35366 }, { "epoch": 0.97, "learning_rate": 6.105908810054239e-08, "loss": 1.1025, "step": 35367 }, { "epoch": 0.97, "learning_rate": 6.096153197912347e-08, "loss": 1.3005, "step": 35368 }, { "epoch": 0.97, "learning_rate": 6.08640536160665e-08, "loss": 1.2319, "step": 35369 }, { "epoch": 0.97, "learning_rate": 6.076665301213646e-08, "loss": 1.2603, "step": 35370 }, { "epoch": 0.97, "learning_rate": 6.066933016809384e-08, "loss": 1.2129, "step": 35371 }, { "epoch": 0.97, "learning_rate": 6.057208508470136e-08, "loss": 1.2104, "step": 35372 }, { "epoch": 0.97, "learning_rate": 6.04749177627173e-08, "loss": 1.1558, "step": 35373 }, { "epoch": 0.97, "learning_rate": 6.03778282029055e-08, "loss": 1.0972, "step": 35374 }, { "epoch": 0.97, "learning_rate": 6.028081640602313e-08, "loss": 1.3867, "step": 35375 }, { "epoch": 0.97, "learning_rate": 6.018388237282957e-08, "loss": 1.4561, "step": 35376 }, { "epoch": 0.97, "learning_rate": 6.008702610408201e-08, "loss": 1.2053, "step": 35377 }, { "epoch": 0.97, "learning_rate": 5.999024760054095e-08, "loss": 1.2461, "step": 35378 }, { "epoch": 0.97, "learning_rate": 5.989354686296245e-08, "loss": 1.2925, "step": 35379 }, { "epoch": 0.97, "learning_rate": 5.979692389210145e-08, "loss": 1.2444, "step": 35380 }, { "epoch": 0.97, "learning_rate": 5.970037868871514e-08, "loss": 1.0509, "step": 35381 }, { "epoch": 0.97, "learning_rate": 5.9603911253559574e-08, "loss": 1.3386, "step": 35382 }, { "epoch": 0.97, "learning_rate": 5.950752158738859e-08, "loss": 1.3018, "step": 35383 }, { "epoch": 0.97, "learning_rate": 5.941120969095604e-08, "loss": 1.1277, "step": 35384 }, { "epoch": 0.97, "learning_rate": 5.931497556501575e-08, "loss": 1.2388, "step": 35385 }, { "epoch": 0.97, "learning_rate": 5.9218819210320466e-08, "loss": 1.135, "step": 35386 }, { "epoch": 0.97, "learning_rate": 5.912274062762402e-08, "loss": 1.2437, "step": 35387 }, { "epoch": 0.97, "learning_rate": 5.9026739817675814e-08, "loss": 1.2993, "step": 35388 }, { "epoch": 0.97, "learning_rate": 5.8930816781227475e-08, "loss": 1.1887, "step": 35389 }, { "epoch": 0.97, "learning_rate": 5.88349715190295e-08, "loss": 1.3872, "step": 35390 }, { "epoch": 0.97, "learning_rate": 5.873920403183353e-08, "loss": 1.2612, "step": 35391 }, { "epoch": 0.97, "learning_rate": 5.864351432038562e-08, "loss": 1.2717, "step": 35392 }, { "epoch": 0.97, "learning_rate": 5.85479023854374e-08, "loss": 1.2402, "step": 35393 }, { "epoch": 0.97, "learning_rate": 5.8452368227734924e-08, "loss": 1.4617, "step": 35394 }, { "epoch": 0.97, "learning_rate": 5.8356911848026496e-08, "loss": 1.3125, "step": 35395 }, { "epoch": 0.97, "learning_rate": 5.82615332470593e-08, "loss": 1.3528, "step": 35396 }, { "epoch": 0.97, "learning_rate": 5.816623242557717e-08, "loss": 1.3276, "step": 35397 }, { "epoch": 0.97, "learning_rate": 5.807100938432841e-08, "loss": 1.176, "step": 35398 }, { "epoch": 0.97, "learning_rate": 5.797586412405798e-08, "loss": 1.3406, "step": 35399 }, { "epoch": 0.97, "learning_rate": 5.788079664550861e-08, "loss": 1.1172, "step": 35400 }, { "epoch": 0.97, "learning_rate": 5.778580694942415e-08, "loss": 1.2319, "step": 35401 }, { "epoch": 0.97, "learning_rate": 5.7690895036549564e-08, "loss": 1.2214, "step": 35402 }, { "epoch": 0.97, "learning_rate": 5.759606090762537e-08, "loss": 1.104, "step": 35403 }, { "epoch": 0.97, "learning_rate": 5.7501304563394314e-08, "loss": 1.3098, "step": 35404 }, { "epoch": 0.97, "learning_rate": 5.740662600459801e-08, "loss": 1.3594, "step": 35405 }, { "epoch": 0.97, "learning_rate": 5.731202523197699e-08, "loss": 1.1753, "step": 35406 }, { "epoch": 0.97, "learning_rate": 5.721750224627176e-08, "loss": 1.3398, "step": 35407 }, { "epoch": 0.97, "learning_rate": 5.712305704822063e-08, "loss": 1.2939, "step": 35408 }, { "epoch": 0.97, "learning_rate": 5.702868963856301e-08, "loss": 1.4146, "step": 35409 }, { "epoch": 0.97, "learning_rate": 5.6934400018038295e-08, "loss": 1.1228, "step": 35410 }, { "epoch": 0.97, "learning_rate": 5.684018818738257e-08, "loss": 1.3174, "step": 35411 }, { "epoch": 0.97, "learning_rate": 5.6746054147334136e-08, "loss": 1.2827, "step": 35412 }, { "epoch": 0.97, "learning_rate": 5.665199789862907e-08, "loss": 1.2522, "step": 35413 }, { "epoch": 0.97, "learning_rate": 5.6558019442002344e-08, "loss": 1.1747, "step": 35414 }, { "epoch": 0.97, "learning_rate": 5.646411877819113e-08, "loss": 1.3623, "step": 35415 }, { "epoch": 0.97, "learning_rate": 5.6370295907927085e-08, "loss": 1.1594, "step": 35416 }, { "epoch": 0.97, "learning_rate": 5.627655083194739e-08, "loss": 1.1425, "step": 35417 }, { "epoch": 0.97, "learning_rate": 5.618288355098367e-08, "loss": 1.3005, "step": 35418 }, { "epoch": 0.97, "learning_rate": 5.608929406576868e-08, "loss": 1.1572, "step": 35419 }, { "epoch": 0.97, "learning_rate": 5.599578237703629e-08, "loss": 1.6802, "step": 35420 }, { "epoch": 0.97, "learning_rate": 5.59023484855159e-08, "loss": 1.2666, "step": 35421 }, { "epoch": 0.97, "learning_rate": 5.580899239194026e-08, "loss": 1.3452, "step": 35422 }, { "epoch": 0.97, "learning_rate": 5.5715714097037685e-08, "loss": 1.302, "step": 35423 }, { "epoch": 0.97, "learning_rate": 5.5622513601539805e-08, "loss": 1.26, "step": 35424 }, { "epoch": 0.97, "learning_rate": 5.552939090617493e-08, "loss": 1.47, "step": 35425 }, { "epoch": 0.97, "learning_rate": 5.543634601167358e-08, "loss": 1.1333, "step": 35426 }, { "epoch": 0.97, "learning_rate": 5.534337891876074e-08, "loss": 1.2883, "step": 35427 }, { "epoch": 0.97, "learning_rate": 5.5250489628164705e-08, "loss": 1.3188, "step": 35428 }, { "epoch": 0.97, "learning_rate": 5.5157678140612684e-08, "loss": 1.2104, "step": 35429 }, { "epoch": 0.97, "learning_rate": 5.506494445683186e-08, "loss": 1.3408, "step": 35430 }, { "epoch": 0.97, "learning_rate": 5.4972288577545e-08, "loss": 1.3152, "step": 35431 }, { "epoch": 0.97, "learning_rate": 5.4879710503478176e-08, "loss": 1.2678, "step": 35432 }, { "epoch": 0.97, "learning_rate": 5.478721023535638e-08, "loss": 1.8032, "step": 35433 }, { "epoch": 0.97, "learning_rate": 5.469478777390347e-08, "loss": 1.1797, "step": 35434 }, { "epoch": 0.97, "learning_rate": 5.46024431198422e-08, "loss": 1.3044, "step": 35435 }, { "epoch": 0.97, "learning_rate": 5.451017627389421e-08, "loss": 1.208, "step": 35436 }, { "epoch": 0.97, "learning_rate": 5.4417987236781156e-08, "loss": 1.3037, "step": 35437 }, { "epoch": 0.97, "learning_rate": 5.4325876009226895e-08, "loss": 1.2148, "step": 35438 }, { "epoch": 0.97, "learning_rate": 5.4233842591948635e-08, "loss": 1.1719, "step": 35439 }, { "epoch": 0.97, "learning_rate": 5.414188698566803e-08, "loss": 1.2429, "step": 35440 }, { "epoch": 0.97, "learning_rate": 5.405000919110448e-08, "loss": 1.2959, "step": 35441 }, { "epoch": 0.97, "learning_rate": 5.395820920897743e-08, "loss": 1.3206, "step": 35442 }, { "epoch": 0.97, "learning_rate": 5.3866487040004076e-08, "loss": 1.4385, "step": 35443 }, { "epoch": 0.97, "learning_rate": 5.377484268490163e-08, "loss": 1.1643, "step": 35444 }, { "epoch": 0.97, "learning_rate": 5.36832761443884e-08, "loss": 1.3376, "step": 35445 }, { "epoch": 0.97, "learning_rate": 5.3591787419180475e-08, "loss": 1.2351, "step": 35446 }, { "epoch": 0.97, "learning_rate": 5.350037650999284e-08, "loss": 1.2244, "step": 35447 }, { "epoch": 0.97, "learning_rate": 5.340904341754049e-08, "loss": 1.3108, "step": 35448 }, { "epoch": 0.97, "learning_rate": 5.331778814253952e-08, "loss": 1.1082, "step": 35449 }, { "epoch": 0.97, "learning_rate": 5.322661068570267e-08, "loss": 1.1926, "step": 35450 }, { "epoch": 0.97, "learning_rate": 5.313551104774384e-08, "loss": 1.2593, "step": 35451 }, { "epoch": 0.97, "learning_rate": 5.3044489229374665e-08, "loss": 1.1528, "step": 35452 }, { "epoch": 0.97, "learning_rate": 5.2953545231309024e-08, "loss": 1.2192, "step": 35453 }, { "epoch": 0.97, "learning_rate": 5.2862679054256347e-08, "loss": 1.1797, "step": 35454 }, { "epoch": 0.97, "learning_rate": 5.2771890698929404e-08, "loss": 1.8125, "step": 35455 }, { "epoch": 0.97, "learning_rate": 5.2681180166036515e-08, "loss": 1.2078, "step": 35456 }, { "epoch": 0.97, "learning_rate": 5.2590547456290444e-08, "loss": 1.2527, "step": 35457 }, { "epoch": 0.97, "learning_rate": 5.2499992570397285e-08, "loss": 1.2876, "step": 35458 }, { "epoch": 0.97, "learning_rate": 5.240951550906537e-08, "loss": 1.1152, "step": 35459 }, { "epoch": 0.97, "learning_rate": 5.2319116273005235e-08, "loss": 1.3486, "step": 35460 }, { "epoch": 0.97, "learning_rate": 5.2228794862921874e-08, "loss": 1.2151, "step": 35461 }, { "epoch": 0.97, "learning_rate": 5.2138551279523606e-08, "loss": 1.2791, "step": 35462 }, { "epoch": 0.97, "learning_rate": 5.204838552351432e-08, "loss": 1.2363, "step": 35463 }, { "epoch": 0.97, "learning_rate": 5.195829759560123e-08, "loss": 1.2688, "step": 35464 }, { "epoch": 0.97, "learning_rate": 5.1868287496488204e-08, "loss": 1.2734, "step": 35465 }, { "epoch": 0.97, "learning_rate": 5.1778355226880236e-08, "loss": 1.1501, "step": 35466 }, { "epoch": 0.97, "learning_rate": 5.168850078748011e-08, "loss": 1.3074, "step": 35467 }, { "epoch": 0.97, "learning_rate": 5.1598724178991696e-08, "loss": 1.1072, "step": 35468 }, { "epoch": 0.97, "learning_rate": 5.150902540211666e-08, "loss": 1.3064, "step": 35469 }, { "epoch": 0.97, "learning_rate": 5.141940445755555e-08, "loss": 1.2375, "step": 35470 }, { "epoch": 0.97, "learning_rate": 5.132986134601225e-08, "loss": 1.2598, "step": 35471 }, { "epoch": 0.97, "learning_rate": 5.1240396068185095e-08, "loss": 1.283, "step": 35472 }, { "epoch": 0.97, "learning_rate": 5.115100862477573e-08, "loss": 1.1329, "step": 35473 }, { "epoch": 0.97, "learning_rate": 5.1061699016482504e-08, "loss": 1.3936, "step": 35474 }, { "epoch": 0.97, "learning_rate": 5.097246724400373e-08, "loss": 1.0806, "step": 35475 }, { "epoch": 0.97, "learning_rate": 5.088331330803775e-08, "loss": 1.1301, "step": 35476 }, { "epoch": 0.97, "learning_rate": 5.079423720928289e-08, "loss": 1.3679, "step": 35477 }, { "epoch": 0.97, "learning_rate": 5.0705238948435264e-08, "loss": 1.2, "step": 35478 }, { "epoch": 0.97, "learning_rate": 5.061631852619209e-08, "loss": 1.0895, "step": 35479 }, { "epoch": 0.97, "learning_rate": 5.052747594324725e-08, "loss": 1.156, "step": 35480 }, { "epoch": 0.97, "learning_rate": 5.0438711200296865e-08, "loss": 1.2266, "step": 35481 }, { "epoch": 0.97, "learning_rate": 5.0350024298035926e-08, "loss": 1.2109, "step": 35482 }, { "epoch": 0.97, "learning_rate": 5.026141523715722e-08, "loss": 1.26, "step": 35483 }, { "epoch": 0.97, "learning_rate": 5.0172884018354626e-08, "loss": 1.282, "step": 35484 }, { "epoch": 0.97, "learning_rate": 5.008443064232094e-08, "loss": 1.3044, "step": 35485 }, { "epoch": 0.97, "learning_rate": 4.999605510974892e-08, "loss": 1.2244, "step": 35486 }, { "epoch": 0.97, "learning_rate": 4.990775742132692e-08, "loss": 0.9934, "step": 35487 }, { "epoch": 0.97, "learning_rate": 4.9819537577748825e-08, "loss": 1.2244, "step": 35488 }, { "epoch": 0.97, "learning_rate": 4.9731395579704076e-08, "loss": 1.1689, "step": 35489 }, { "epoch": 0.97, "learning_rate": 4.964333142788102e-08, "loss": 1.2942, "step": 35490 }, { "epoch": 0.97, "learning_rate": 4.955534512297022e-08, "loss": 1.2981, "step": 35491 }, { "epoch": 0.97, "learning_rate": 4.9467436665658896e-08, "loss": 1.1877, "step": 35492 }, { "epoch": 0.97, "learning_rate": 4.93796060566365e-08, "loss": 1.238, "step": 35493 }, { "epoch": 0.97, "learning_rate": 4.9291853296588036e-08, "loss": 1.1704, "step": 35494 }, { "epoch": 0.97, "learning_rate": 4.920417838620073e-08, "loss": 1.323, "step": 35495 }, { "epoch": 0.97, "learning_rate": 4.911658132616071e-08, "loss": 1.2319, "step": 35496 }, { "epoch": 0.97, "learning_rate": 4.902906211715408e-08, "loss": 1.2856, "step": 35497 }, { "epoch": 0.97, "learning_rate": 4.894162075986475e-08, "loss": 1.1769, "step": 35498 }, { "epoch": 0.97, "learning_rate": 4.88542572549755e-08, "loss": 1.2671, "step": 35499 }, { "epoch": 0.97, "learning_rate": 4.876697160317245e-08, "loss": 1.2229, "step": 35500 }, { "epoch": 0.97, "learning_rate": 4.867976380513728e-08, "loss": 1.126, "step": 35501 }, { "epoch": 0.97, "learning_rate": 4.859263386155055e-08, "loss": 1.1704, "step": 35502 }, { "epoch": 0.97, "learning_rate": 4.8505581773097274e-08, "loss": 1.1836, "step": 35503 }, { "epoch": 0.97, "learning_rate": 4.8418607540456905e-08, "loss": 1.269, "step": 35504 }, { "epoch": 0.97, "learning_rate": 4.83317111643089e-08, "loss": 1.2537, "step": 35505 }, { "epoch": 0.97, "learning_rate": 4.824489264533383e-08, "loss": 1.3711, "step": 35506 }, { "epoch": 0.97, "learning_rate": 4.8158151984212254e-08, "loss": 1.2969, "step": 35507 }, { "epoch": 0.97, "learning_rate": 4.80714891816203e-08, "loss": 1.2202, "step": 35508 }, { "epoch": 0.97, "learning_rate": 4.7984904238238537e-08, "loss": 1.4001, "step": 35509 }, { "epoch": 0.97, "learning_rate": 4.789839715474198e-08, "loss": 1.3628, "step": 35510 }, { "epoch": 0.97, "learning_rate": 4.781196793180898e-08, "loss": 1.2515, "step": 35511 }, { "epoch": 0.97, "learning_rate": 4.772561657011565e-08, "loss": 1.3821, "step": 35512 }, { "epoch": 0.97, "learning_rate": 4.763934307033702e-08, "loss": 1.7822, "step": 35513 }, { "epoch": 0.97, "learning_rate": 4.755314743314809e-08, "loss": 1.2141, "step": 35514 }, { "epoch": 0.97, "learning_rate": 4.7467029659223895e-08, "loss": 1.325, "step": 35515 }, { "epoch": 0.97, "learning_rate": 4.7380989749237216e-08, "loss": 1.3416, "step": 35516 }, { "epoch": 0.97, "learning_rate": 4.7295027703860854e-08, "loss": 1.2637, "step": 35517 }, { "epoch": 0.97, "learning_rate": 4.720914352376871e-08, "loss": 1.2007, "step": 35518 }, { "epoch": 0.97, "learning_rate": 4.712333720963247e-08, "loss": 1.188, "step": 35519 }, { "epoch": 0.97, "learning_rate": 4.703760876212271e-08, "loss": 1.1121, "step": 35520 }, { "epoch": 0.97, "learning_rate": 4.695195818191001e-08, "loss": 1.3616, "step": 35521 }, { "epoch": 0.97, "learning_rate": 4.686638546966604e-08, "loss": 1.2307, "step": 35522 }, { "epoch": 0.97, "learning_rate": 4.6780890626058064e-08, "loss": 1.3301, "step": 35523 }, { "epoch": 0.97, "learning_rate": 4.669547365175775e-08, "loss": 1.1714, "step": 35524 }, { "epoch": 0.97, "learning_rate": 4.661013454743013e-08, "loss": 1.239, "step": 35525 }, { "epoch": 0.97, "learning_rate": 4.652487331374467e-08, "loss": 1.207, "step": 35526 }, { "epoch": 0.97, "learning_rate": 4.643968995136861e-08, "loss": 1.2739, "step": 35527 }, { "epoch": 0.97, "learning_rate": 4.635458446096697e-08, "loss": 1.3184, "step": 35528 }, { "epoch": 0.97, "learning_rate": 4.6269556843208105e-08, "loss": 1.1619, "step": 35529 }, { "epoch": 0.97, "learning_rate": 4.618460709875483e-08, "loss": 1.0977, "step": 35530 }, { "epoch": 0.97, "learning_rate": 4.609973522827216e-08, "loss": 1.3413, "step": 35531 }, { "epoch": 0.97, "learning_rate": 4.6014941232425116e-08, "loss": 1.2207, "step": 35532 }, { "epoch": 0.97, "learning_rate": 4.5930225111876506e-08, "loss": 1.3093, "step": 35533 }, { "epoch": 0.97, "learning_rate": 4.584558686728802e-08, "loss": 1.2305, "step": 35534 }, { "epoch": 0.97, "learning_rate": 4.576102649932357e-08, "loss": 1.2158, "step": 35535 }, { "epoch": 0.97, "learning_rate": 4.567654400864485e-08, "loss": 1.2234, "step": 35536 }, { "epoch": 0.97, "learning_rate": 4.5592139395911336e-08, "loss": 1.2007, "step": 35537 }, { "epoch": 0.97, "learning_rate": 4.550781266178361e-08, "loss": 1.1477, "step": 35538 }, { "epoch": 0.97, "learning_rate": 4.542356380692226e-08, "loss": 1.2314, "step": 35539 }, { "epoch": 0.97, "learning_rate": 4.533939283198563e-08, "loss": 1.217, "step": 35540 }, { "epoch": 0.97, "learning_rate": 4.5255299737633206e-08, "loss": 1.3955, "step": 35541 }, { "epoch": 0.97, "learning_rate": 4.517128452452113e-08, "loss": 1.3499, "step": 35542 }, { "epoch": 0.97, "learning_rate": 4.5087347193308873e-08, "loss": 1.1702, "step": 35543 }, { "epoch": 0.97, "learning_rate": 4.5003487744652574e-08, "loss": 1.2856, "step": 35544 }, { "epoch": 0.97, "learning_rate": 4.491970617920727e-08, "loss": 1.3955, "step": 35545 }, { "epoch": 0.97, "learning_rate": 4.4836002497627985e-08, "loss": 1.1768, "step": 35546 }, { "epoch": 0.97, "learning_rate": 4.4752376700571974e-08, "loss": 1.3335, "step": 35547 }, { "epoch": 0.97, "learning_rate": 4.4668828788690945e-08, "loss": 1.1777, "step": 35548 }, { "epoch": 0.97, "learning_rate": 4.458535876263992e-08, "loss": 1.2551, "step": 35549 }, { "epoch": 0.97, "learning_rate": 4.450196662307171e-08, "loss": 1.2446, "step": 35550 }, { "epoch": 0.97, "learning_rate": 4.4418652370639135e-08, "loss": 1.3916, "step": 35551 }, { "epoch": 0.97, "learning_rate": 4.433541600599389e-08, "loss": 1.2285, "step": 35552 }, { "epoch": 0.97, "learning_rate": 4.425225752978657e-08, "loss": 1.249, "step": 35553 }, { "epoch": 0.97, "learning_rate": 4.416917694266776e-08, "loss": 1.1914, "step": 35554 }, { "epoch": 0.97, "learning_rate": 4.408617424528805e-08, "loss": 1.2671, "step": 35555 }, { "epoch": 0.97, "learning_rate": 4.400324943829581e-08, "loss": 1.3027, "step": 35556 }, { "epoch": 0.97, "learning_rate": 4.392040252234164e-08, "loss": 1.2378, "step": 35557 }, { "epoch": 0.97, "learning_rate": 4.383763349807168e-08, "loss": 1.2134, "step": 35558 }, { "epoch": 0.97, "learning_rate": 4.375494236613431e-08, "loss": 1.3855, "step": 35559 }, { "epoch": 0.97, "learning_rate": 4.367232912717678e-08, "loss": 1.3113, "step": 35560 }, { "epoch": 0.97, "learning_rate": 4.3589793781845244e-08, "loss": 1.2305, "step": 35561 }, { "epoch": 0.97, "learning_rate": 4.3507336330785856e-08, "loss": 1.1902, "step": 35562 }, { "epoch": 0.97, "learning_rate": 4.342495677464253e-08, "loss": 1.0808, "step": 35563 }, { "epoch": 0.97, "learning_rate": 4.334265511406033e-08, "loss": 1.3013, "step": 35564 }, { "epoch": 0.97, "learning_rate": 4.3260431349683166e-08, "loss": 1.176, "step": 35565 }, { "epoch": 0.97, "learning_rate": 4.317828548215497e-08, "loss": 1.1965, "step": 35566 }, { "epoch": 0.97, "learning_rate": 4.3096217512117454e-08, "loss": 1.2361, "step": 35567 }, { "epoch": 0.97, "learning_rate": 4.301422744021344e-08, "loss": 1.196, "step": 35568 }, { "epoch": 0.97, "learning_rate": 4.2932315267083525e-08, "loss": 1.1587, "step": 35569 }, { "epoch": 0.97, "learning_rate": 4.2850480993369414e-08, "loss": 1.2729, "step": 35570 }, { "epoch": 0.97, "learning_rate": 4.27687246197106e-08, "loss": 1.262, "step": 35571 }, { "epoch": 0.97, "learning_rate": 4.268704614674768e-08, "loss": 1.1038, "step": 35572 }, { "epoch": 0.97, "learning_rate": 4.2605445575117924e-08, "loss": 1.064, "step": 35573 }, { "epoch": 0.97, "learning_rate": 4.252392290546192e-08, "loss": 1.1233, "step": 35574 }, { "epoch": 0.97, "learning_rate": 4.244247813841584e-08, "loss": 1.1637, "step": 35575 }, { "epoch": 0.97, "learning_rate": 4.236111127461806e-08, "loss": 1.1992, "step": 35576 }, { "epoch": 0.97, "learning_rate": 4.2279822314703625e-08, "loss": 1.2021, "step": 35577 }, { "epoch": 0.97, "learning_rate": 4.21986112593098e-08, "loss": 1.2439, "step": 35578 }, { "epoch": 0.97, "learning_rate": 4.211747810907163e-08, "loss": 1.3413, "step": 35579 }, { "epoch": 0.97, "learning_rate": 4.203642286462417e-08, "loss": 1.2214, "step": 35580 }, { "epoch": 0.97, "learning_rate": 4.1955445526600245e-08, "loss": 1.3467, "step": 35581 }, { "epoch": 0.97, "learning_rate": 4.187454609563601e-08, "loss": 1.2532, "step": 35582 }, { "epoch": 0.97, "learning_rate": 4.179372457236097e-08, "loss": 1.2002, "step": 35583 }, { "epoch": 0.97, "learning_rate": 4.1712980957410166e-08, "loss": 1.2317, "step": 35584 }, { "epoch": 0.97, "learning_rate": 4.163231525141309e-08, "loss": 1.2988, "step": 35585 }, { "epoch": 0.97, "learning_rate": 4.155172745500369e-08, "loss": 1.2297, "step": 35586 }, { "epoch": 0.97, "learning_rate": 4.147121756880923e-08, "loss": 1.3115, "step": 35587 }, { "epoch": 0.97, "learning_rate": 4.139078559346255e-08, "loss": 1.2607, "step": 35588 }, { "epoch": 0.97, "learning_rate": 4.13104315295898e-08, "loss": 1.167, "step": 35589 }, { "epoch": 0.97, "learning_rate": 4.123015537782271e-08, "loss": 1.1897, "step": 35590 }, { "epoch": 0.97, "learning_rate": 4.1149957138787444e-08, "loss": 1.2996, "step": 35591 }, { "epoch": 0.97, "learning_rate": 4.1069836813112385e-08, "loss": 1.2114, "step": 35592 }, { "epoch": 0.97, "learning_rate": 4.0989794401423696e-08, "loss": 1.2837, "step": 35593 }, { "epoch": 0.97, "learning_rate": 4.090982990434644e-08, "loss": 1.4031, "step": 35594 }, { "epoch": 0.97, "learning_rate": 4.082994332251011e-08, "loss": 1.082, "step": 35595 }, { "epoch": 0.97, "learning_rate": 4.0750134656535324e-08, "loss": 1.2874, "step": 35596 }, { "epoch": 0.97, "learning_rate": 4.067040390704824e-08, "loss": 1.2542, "step": 35597 }, { "epoch": 0.97, "learning_rate": 4.0590751074673914e-08, "loss": 1.2949, "step": 35598 }, { "epoch": 0.97, "learning_rate": 4.0511176160034085e-08, "loss": 1.2356, "step": 35599 }, { "epoch": 0.97, "learning_rate": 4.043167916375046e-08, "loss": 1.2205, "step": 35600 }, { "epoch": 0.97, "learning_rate": 4.035226008644699e-08, "loss": 1.1274, "step": 35601 }, { "epoch": 0.97, "learning_rate": 4.0272918928743185e-08, "loss": 1.2307, "step": 35602 }, { "epoch": 0.97, "learning_rate": 4.0193655691261876e-08, "loss": 1.2123, "step": 35603 }, { "epoch": 0.97, "learning_rate": 4.011447037462146e-08, "loss": 1.167, "step": 35604 }, { "epoch": 0.97, "learning_rate": 4.003536297944144e-08, "loss": 1.2839, "step": 35605 }, { "epoch": 0.97, "learning_rate": 3.9956333506342427e-08, "loss": 1.1914, "step": 35606 }, { "epoch": 0.97, "learning_rate": 3.98773819559406e-08, "loss": 1.3379, "step": 35607 }, { "epoch": 0.97, "learning_rate": 3.979850832885435e-08, "loss": 1.3906, "step": 35608 }, { "epoch": 0.97, "learning_rate": 3.971971262570096e-08, "loss": 1.2158, "step": 35609 }, { "epoch": 0.97, "learning_rate": 3.9640994847097714e-08, "loss": 1.1155, "step": 35610 }, { "epoch": 0.97, "learning_rate": 3.956235499365968e-08, "loss": 1.219, "step": 35611 }, { "epoch": 0.97, "learning_rate": 3.948379306600192e-08, "loss": 1.3655, "step": 35612 }, { "epoch": 0.97, "learning_rate": 3.940530906473838e-08, "loss": 1.1921, "step": 35613 }, { "epoch": 0.97, "learning_rate": 3.932690299048414e-08, "loss": 1.3464, "step": 35614 }, { "epoch": 0.97, "learning_rate": 3.924857484385314e-08, "loss": 1.0229, "step": 35615 }, { "epoch": 0.97, "learning_rate": 3.9170324625456e-08, "loss": 1.1672, "step": 35616 }, { "epoch": 0.97, "learning_rate": 3.9092152335907795e-08, "loss": 1.2727, "step": 35617 }, { "epoch": 0.97, "learning_rate": 3.901405797581803e-08, "loss": 1.3306, "step": 35618 }, { "epoch": 0.97, "learning_rate": 3.893604154579844e-08, "loss": 1.0193, "step": 35619 }, { "epoch": 0.97, "learning_rate": 3.885810304645854e-08, "loss": 1.2354, "step": 35620 }, { "epoch": 0.97, "learning_rate": 3.8780242478410057e-08, "loss": 1.049, "step": 35621 }, { "epoch": 0.97, "learning_rate": 3.870245984226029e-08, "loss": 1.2485, "step": 35622 }, { "epoch": 0.97, "learning_rate": 3.862475513861763e-08, "loss": 1.0854, "step": 35623 }, { "epoch": 0.97, "learning_rate": 3.85471283680916e-08, "loss": 1.748, "step": 35624 }, { "epoch": 0.97, "learning_rate": 3.846957953128838e-08, "loss": 1.283, "step": 35625 }, { "epoch": 0.97, "learning_rate": 3.839210862881526e-08, "loss": 1.1606, "step": 35626 }, { "epoch": 0.97, "learning_rate": 3.831471566127731e-08, "loss": 1.197, "step": 35627 }, { "epoch": 0.97, "learning_rate": 3.823740062928072e-08, "loss": 1.1567, "step": 35628 }, { "epoch": 0.97, "learning_rate": 3.816016353343055e-08, "loss": 1.2356, "step": 35629 }, { "epoch": 0.97, "learning_rate": 3.8083004374330765e-08, "loss": 1.187, "step": 35630 }, { "epoch": 0.97, "learning_rate": 3.800592315258644e-08, "loss": 1.2688, "step": 35631 }, { "epoch": 0.97, "learning_rate": 3.79289198687971e-08, "loss": 1.3569, "step": 35632 }, { "epoch": 0.97, "learning_rate": 3.785199452356891e-08, "loss": 1.2188, "step": 35633 }, { "epoch": 0.97, "learning_rate": 3.777514711750252e-08, "loss": 1.3174, "step": 35634 }, { "epoch": 0.97, "learning_rate": 3.7698377651197437e-08, "loss": 1.199, "step": 35635 }, { "epoch": 0.97, "learning_rate": 3.7621686125256516e-08, "loss": 1.2961, "step": 35636 }, { "epoch": 0.97, "learning_rate": 3.754507254027817e-08, "loss": 1.3245, "step": 35637 }, { "epoch": 0.97, "learning_rate": 3.746853689686303e-08, "loss": 1.3477, "step": 35638 }, { "epoch": 0.97, "learning_rate": 3.73920791956095e-08, "loss": 1.2007, "step": 35639 }, { "epoch": 0.97, "learning_rate": 3.731569943711599e-08, "loss": 1.3477, "step": 35640 }, { "epoch": 0.97, "learning_rate": 3.72393976219787e-08, "loss": 1.2234, "step": 35641 }, { "epoch": 0.97, "learning_rate": 3.7163173750796034e-08, "loss": 1.1155, "step": 35642 }, { "epoch": 0.97, "learning_rate": 3.708702782416307e-08, "loss": 1.2654, "step": 35643 }, { "epoch": 0.97, "learning_rate": 3.701095984267711e-08, "loss": 1.2249, "step": 35644 }, { "epoch": 0.97, "learning_rate": 3.693496980693212e-08, "loss": 1.4536, "step": 35645 }, { "epoch": 0.97, "learning_rate": 3.685905771752429e-08, "loss": 1.2295, "step": 35646 }, { "epoch": 0.97, "learning_rate": 3.678322357504427e-08, "loss": 1.1851, "step": 35647 }, { "epoch": 0.97, "learning_rate": 3.670746738008823e-08, "loss": 1.2375, "step": 35648 }, { "epoch": 0.97, "learning_rate": 3.663178913324794e-08, "loss": 1.2019, "step": 35649 }, { "epoch": 0.97, "learning_rate": 3.6556188835115134e-08, "loss": 1.3206, "step": 35650 }, { "epoch": 0.97, "learning_rate": 3.648066648628157e-08, "loss": 1.3428, "step": 35651 }, { "epoch": 0.97, "learning_rate": 3.640522208733899e-08, "loss": 1.2019, "step": 35652 }, { "epoch": 0.97, "learning_rate": 3.632985563887581e-08, "loss": 1.3442, "step": 35653 }, { "epoch": 0.97, "learning_rate": 3.625456714148268e-08, "loss": 1.1658, "step": 35654 }, { "epoch": 0.97, "learning_rate": 3.617935659574801e-08, "loss": 1.2542, "step": 35655 }, { "epoch": 0.97, "learning_rate": 3.610422400226132e-08, "loss": 1.1714, "step": 35656 }, { "epoch": 0.97, "learning_rate": 3.602916936160994e-08, "loss": 1.1797, "step": 35657 }, { "epoch": 0.97, "learning_rate": 3.5954192674381163e-08, "loss": 1.2957, "step": 35658 }, { "epoch": 0.97, "learning_rate": 3.587929394116119e-08, "loss": 1.2356, "step": 35659 }, { "epoch": 0.97, "learning_rate": 3.5804473162535104e-08, "loss": 1.3225, "step": 35660 }, { "epoch": 0.97, "learning_rate": 3.572973033909022e-08, "loss": 1.343, "step": 35661 }, { "epoch": 0.97, "learning_rate": 3.565506547141051e-08, "loss": 1.2007, "step": 35662 }, { "epoch": 0.97, "learning_rate": 3.5580478560081066e-08, "loss": 1.3398, "step": 35663 }, { "epoch": 0.97, "learning_rate": 3.5505969605682536e-08, "loss": 1.1707, "step": 35664 }, { "epoch": 0.97, "learning_rate": 3.5431538608799995e-08, "loss": 1.1965, "step": 35665 }, { "epoch": 0.97, "learning_rate": 3.535718557001633e-08, "loss": 1.238, "step": 35666 }, { "epoch": 0.97, "learning_rate": 3.528291048991217e-08, "loss": 1.283, "step": 35667 }, { "epoch": 0.97, "learning_rate": 3.520871336906706e-08, "loss": 1.2673, "step": 35668 }, { "epoch": 0.97, "learning_rate": 3.5134594208064974e-08, "loss": 1.291, "step": 35669 }, { "epoch": 0.97, "learning_rate": 3.506055300748434e-08, "loss": 1.3162, "step": 35670 }, { "epoch": 0.97, "learning_rate": 3.498658976790248e-08, "loss": 1.158, "step": 35671 }, { "epoch": 0.97, "learning_rate": 3.491270448990114e-08, "loss": 1.3496, "step": 35672 }, { "epoch": 0.97, "learning_rate": 3.483889717405542e-08, "loss": 1.137, "step": 35673 }, { "epoch": 0.97, "learning_rate": 3.4765167820945965e-08, "loss": 1.2686, "step": 35674 }, { "epoch": 0.97, "learning_rate": 3.4691516431146767e-08, "loss": 1.1858, "step": 35675 }, { "epoch": 0.97, "learning_rate": 3.461794300523513e-08, "loss": 1.4233, "step": 35676 }, { "epoch": 0.97, "learning_rate": 3.454444754378616e-08, "loss": 1.1731, "step": 35677 }, { "epoch": 0.97, "learning_rate": 3.447103004737606e-08, "loss": 1.3948, "step": 35678 }, { "epoch": 0.97, "learning_rate": 3.439769051657882e-08, "loss": 1.1956, "step": 35679 }, { "epoch": 0.97, "learning_rate": 3.43244289519673e-08, "loss": 1.1603, "step": 35680 }, { "epoch": 0.97, "learning_rate": 3.4251245354115506e-08, "loss": 1.2629, "step": 35681 }, { "epoch": 0.97, "learning_rate": 3.4178139723596296e-08, "loss": 1.1482, "step": 35682 }, { "epoch": 0.97, "learning_rate": 3.4105112060980326e-08, "loss": 1.0779, "step": 35683 }, { "epoch": 0.97, "learning_rate": 3.403216236683937e-08, "loss": 1.2153, "step": 35684 }, { "epoch": 0.97, "learning_rate": 3.395929064174519e-08, "loss": 1.3491, "step": 35685 }, { "epoch": 0.97, "learning_rate": 3.388649688626733e-08, "loss": 1.197, "step": 35686 }, { "epoch": 0.97, "learning_rate": 3.3813781100974216e-08, "loss": 1.2036, "step": 35687 }, { "epoch": 0.97, "learning_rate": 3.374114328643541e-08, "loss": 1.3154, "step": 35688 }, { "epoch": 0.97, "learning_rate": 3.3668583443220437e-08, "loss": 1.3477, "step": 35689 }, { "epoch": 0.97, "learning_rate": 3.3596101571895524e-08, "loss": 1.3474, "step": 35690 }, { "epoch": 0.97, "learning_rate": 3.3523697673029095e-08, "loss": 1.2871, "step": 35691 }, { "epoch": 0.97, "learning_rate": 3.3451371747185155e-08, "loss": 1.6265, "step": 35692 }, { "epoch": 0.97, "learning_rate": 3.3379123794932136e-08, "loss": 1.3047, "step": 35693 }, { "epoch": 0.97, "learning_rate": 3.330695381683402e-08, "loss": 1.2664, "step": 35694 }, { "epoch": 0.97, "learning_rate": 3.323486181345481e-08, "loss": 1.2996, "step": 35695 }, { "epoch": 0.97, "learning_rate": 3.316284778536072e-08, "loss": 1.1777, "step": 35696 }, { "epoch": 0.97, "learning_rate": 3.309091173311352e-08, "loss": 1.2729, "step": 35697 }, { "epoch": 0.97, "learning_rate": 3.301905365727498e-08, "loss": 1.3064, "step": 35698 }, { "epoch": 0.97, "learning_rate": 3.294727355841021e-08, "loss": 1.1785, "step": 35699 }, { "epoch": 0.97, "learning_rate": 3.2875571437077645e-08, "loss": 1.3008, "step": 35700 }, { "epoch": 0.97, "learning_rate": 3.280394729384129e-08, "loss": 1.1165, "step": 35701 }, { "epoch": 0.97, "learning_rate": 3.273240112925846e-08, "loss": 1.2444, "step": 35702 }, { "epoch": 0.98, "learning_rate": 3.266093294389094e-08, "loss": 1.3367, "step": 35703 }, { "epoch": 0.98, "learning_rate": 3.258954273829717e-08, "loss": 1.1541, "step": 35704 }, { "epoch": 0.98, "learning_rate": 3.2518230513035595e-08, "loss": 1.2793, "step": 35705 }, { "epoch": 0.98, "learning_rate": 3.2446996268665766e-08, "loss": 1.1877, "step": 35706 }, { "epoch": 0.98, "learning_rate": 3.237584000574168e-08, "loss": 1.2373, "step": 35707 }, { "epoch": 0.98, "learning_rate": 3.2304761724822885e-08, "loss": 1.1272, "step": 35708 }, { "epoch": 0.98, "learning_rate": 3.223376142646451e-08, "loss": 1.2656, "step": 35709 }, { "epoch": 0.98, "learning_rate": 3.216283911122275e-08, "loss": 1.3142, "step": 35710 }, { "epoch": 0.98, "learning_rate": 3.209199477965053e-08, "loss": 1.0886, "step": 35711 }, { "epoch": 0.98, "learning_rate": 3.202122843230293e-08, "loss": 1.395, "step": 35712 }, { "epoch": 0.98, "learning_rate": 3.195054006973508e-08, "loss": 1.2581, "step": 35713 }, { "epoch": 0.98, "learning_rate": 3.187992969249876e-08, "loss": 0.9302, "step": 35714 }, { "epoch": 0.98, "learning_rate": 3.180939730114574e-08, "loss": 1.1956, "step": 35715 }, { "epoch": 0.98, "learning_rate": 3.173894289623003e-08, "loss": 1.3035, "step": 35716 }, { "epoch": 0.98, "learning_rate": 3.166856647830008e-08, "loss": 1.1462, "step": 35717 }, { "epoch": 0.98, "learning_rate": 3.159826804790766e-08, "loss": 1.2615, "step": 35718 }, { "epoch": 0.98, "learning_rate": 3.152804760560457e-08, "loss": 1.3359, "step": 35719 }, { "epoch": 0.98, "learning_rate": 3.145790515193703e-08, "loss": 1.4102, "step": 35720 }, { "epoch": 0.98, "learning_rate": 3.1387840687455704e-08, "loss": 1.687, "step": 35721 }, { "epoch": 0.98, "learning_rate": 3.1317854212709054e-08, "loss": 1.2207, "step": 35722 }, { "epoch": 0.98, "learning_rate": 3.12479457282433e-08, "loss": 1.3298, "step": 35723 }, { "epoch": 0.98, "learning_rate": 3.117811523460579e-08, "loss": 1.3926, "step": 35724 }, { "epoch": 0.98, "learning_rate": 3.1108362732342747e-08, "loss": 1.2542, "step": 35725 }, { "epoch": 0.98, "learning_rate": 3.1038688222000404e-08, "loss": 1.387, "step": 35726 }, { "epoch": 0.98, "learning_rate": 3.0969091704124986e-08, "loss": 1.2124, "step": 35727 }, { "epoch": 0.98, "learning_rate": 3.089957317925829e-08, "loss": 1.3127, "step": 35728 }, { "epoch": 0.98, "learning_rate": 3.083013264794543e-08, "loss": 1.3008, "step": 35729 }, { "epoch": 0.98, "learning_rate": 3.076077011073042e-08, "loss": 1.4478, "step": 35730 }, { "epoch": 0.98, "learning_rate": 3.0691485568155045e-08, "loss": 1.1846, "step": 35731 }, { "epoch": 0.98, "learning_rate": 3.062227902076109e-08, "loss": 1.1047, "step": 35732 }, { "epoch": 0.98, "learning_rate": 3.055315046909035e-08, "loss": 1.7275, "step": 35733 }, { "epoch": 0.98, "learning_rate": 3.048409991368462e-08, "loss": 1.1709, "step": 35734 }, { "epoch": 0.98, "learning_rate": 3.041512735508345e-08, "loss": 1.2896, "step": 35735 }, { "epoch": 0.98, "learning_rate": 3.034623279382643e-08, "loss": 1.2581, "step": 35736 }, { "epoch": 0.98, "learning_rate": 3.0277416230450885e-08, "loss": 1.186, "step": 35737 }, { "epoch": 0.98, "learning_rate": 3.020867766549862e-08, "loss": 1.1887, "step": 35738 }, { "epoch": 0.98, "learning_rate": 3.0140017099503646e-08, "loss": 1.3279, "step": 35739 }, { "epoch": 0.98, "learning_rate": 3.007143453300665e-08, "loss": 1.272, "step": 35740 }, { "epoch": 0.98, "learning_rate": 3.000292996654164e-08, "loss": 1.3643, "step": 35741 }, { "epoch": 0.98, "learning_rate": 2.993450340064596e-08, "loss": 1.1914, "step": 35742 }, { "epoch": 0.98, "learning_rate": 2.986615483585364e-08, "loss": 1.1624, "step": 35743 }, { "epoch": 0.98, "learning_rate": 2.979788427270203e-08, "loss": 1.2842, "step": 35744 }, { "epoch": 0.98, "learning_rate": 2.9729691711721796e-08, "loss": 1.3501, "step": 35745 }, { "epoch": 0.98, "learning_rate": 2.9661577153449195e-08, "loss": 1.2263, "step": 35746 }, { "epoch": 0.98, "learning_rate": 2.9593540598414906e-08, "loss": 1.2385, "step": 35747 }, { "epoch": 0.98, "learning_rate": 2.9525582047152946e-08, "loss": 1.4343, "step": 35748 }, { "epoch": 0.98, "learning_rate": 2.9457701500194e-08, "loss": 1.3923, "step": 35749 }, { "epoch": 0.98, "learning_rate": 2.9389898958069872e-08, "loss": 1.4707, "step": 35750 }, { "epoch": 0.98, "learning_rate": 2.9322174421310133e-08, "loss": 1.729, "step": 35751 }, { "epoch": 0.98, "learning_rate": 2.9254527890446583e-08, "loss": 1.0555, "step": 35752 }, { "epoch": 0.98, "learning_rate": 2.9186959366005463e-08, "loss": 1.3049, "step": 35753 }, { "epoch": 0.98, "learning_rate": 2.9119468848517463e-08, "loss": 1.3743, "step": 35754 }, { "epoch": 0.98, "learning_rate": 2.905205633851105e-08, "loss": 1.2349, "step": 35755 }, { "epoch": 0.98, "learning_rate": 2.8984721836511354e-08, "loss": 1.1987, "step": 35756 }, { "epoch": 0.98, "learning_rate": 2.8917465343047956e-08, "loss": 1.366, "step": 35757 }, { "epoch": 0.98, "learning_rate": 2.8850286858643773e-08, "loss": 1.2415, "step": 35758 }, { "epoch": 0.98, "learning_rate": 2.8783186383827266e-08, "loss": 1.7363, "step": 35759 }, { "epoch": 0.98, "learning_rate": 2.8716163919122465e-08, "loss": 1.3479, "step": 35760 }, { "epoch": 0.98, "learning_rate": 2.8649219465053392e-08, "loss": 1.1267, "step": 35761 }, { "epoch": 0.98, "learning_rate": 2.858235302214296e-08, "loss": 1.2217, "step": 35762 }, { "epoch": 0.98, "learning_rate": 2.8515564590916312e-08, "loss": 1.3589, "step": 35763 }, { "epoch": 0.98, "learning_rate": 2.8448854171895247e-08, "loss": 1.2341, "step": 35764 }, { "epoch": 0.98, "learning_rate": 2.838222176560046e-08, "loss": 1.3125, "step": 35765 }, { "epoch": 0.98, "learning_rate": 2.8315667372554865e-08, "loss": 1.0559, "step": 35766 }, { "epoch": 0.98, "learning_rate": 2.8249190993278054e-08, "loss": 1.4075, "step": 35767 }, { "epoch": 0.98, "learning_rate": 2.818279262829071e-08, "loss": 1.2488, "step": 35768 }, { "epoch": 0.98, "learning_rate": 2.811647227811243e-08, "loss": 1.1689, "step": 35769 }, { "epoch": 0.98, "learning_rate": 2.8050229943261677e-08, "loss": 1.2683, "step": 35770 }, { "epoch": 0.98, "learning_rate": 2.798406562425582e-08, "loss": 1.3257, "step": 35771 }, { "epoch": 0.98, "learning_rate": 2.7917979321614442e-08, "loss": 1.2988, "step": 35772 }, { "epoch": 0.98, "learning_rate": 2.7851971035853797e-08, "loss": 1.312, "step": 35773 }, { "epoch": 0.98, "learning_rate": 2.778604076748903e-08, "loss": 1.3616, "step": 35774 }, { "epoch": 0.98, "learning_rate": 2.7720188517038615e-08, "loss": 1.2871, "step": 35775 }, { "epoch": 0.98, "learning_rate": 2.7654414285014365e-08, "loss": 1.2812, "step": 35776 }, { "epoch": 0.98, "learning_rate": 2.758871807193364e-08, "loss": 1.1345, "step": 35777 }, { "epoch": 0.98, "learning_rate": 2.7523099878309367e-08, "loss": 1.3215, "step": 35778 }, { "epoch": 0.98, "learning_rate": 2.745755970465447e-08, "loss": 1.2278, "step": 35779 }, { "epoch": 0.98, "learning_rate": 2.7392097551482978e-08, "loss": 1.3818, "step": 35780 }, { "epoch": 0.98, "learning_rate": 2.7326713419305597e-08, "loss": 1.3091, "step": 35781 }, { "epoch": 0.98, "learning_rate": 2.7261407308635247e-08, "loss": 1.2263, "step": 35782 }, { "epoch": 0.98, "learning_rate": 2.7196179219981522e-08, "loss": 1.2356, "step": 35783 }, { "epoch": 0.98, "learning_rate": 2.7131029153855127e-08, "loss": 1.0544, "step": 35784 }, { "epoch": 0.98, "learning_rate": 2.7065957110766762e-08, "loss": 1.2937, "step": 35785 }, { "epoch": 0.98, "learning_rate": 2.7000963091223797e-08, "loss": 1.2192, "step": 35786 }, { "epoch": 0.98, "learning_rate": 2.693604709573694e-08, "loss": 1.0215, "step": 35787 }, { "epoch": 0.98, "learning_rate": 2.687120912481245e-08, "loss": 1.2195, "step": 35788 }, { "epoch": 0.98, "learning_rate": 2.6806449178957693e-08, "loss": 1.3252, "step": 35789 }, { "epoch": 0.98, "learning_rate": 2.6741767258678943e-08, "loss": 1.3567, "step": 35790 }, { "epoch": 0.98, "learning_rate": 2.667716336448356e-08, "loss": 1.375, "step": 35791 }, { "epoch": 0.98, "learning_rate": 2.6612637496875593e-08, "loss": 1.3657, "step": 35792 }, { "epoch": 0.98, "learning_rate": 2.65481896563613e-08, "loss": 1.179, "step": 35793 }, { "epoch": 0.98, "learning_rate": 2.6483819843443615e-08, "loss": 1.311, "step": 35794 }, { "epoch": 0.98, "learning_rate": 2.6419528058626574e-08, "loss": 1.3215, "step": 35795 }, { "epoch": 0.98, "learning_rate": 2.6355314302414225e-08, "loss": 1.4258, "step": 35796 }, { "epoch": 0.98, "learning_rate": 2.6291178575307273e-08, "loss": 1.3024, "step": 35797 }, { "epoch": 0.98, "learning_rate": 2.6227120877807543e-08, "loss": 1.1748, "step": 35798 }, { "epoch": 0.98, "learning_rate": 2.6163141210417965e-08, "loss": 1.175, "step": 35799 }, { "epoch": 0.98, "learning_rate": 2.6099239573637024e-08, "loss": 1.1084, "step": 35800 }, { "epoch": 0.98, "learning_rate": 2.6035415967965437e-08, "loss": 1.1445, "step": 35801 }, { "epoch": 0.98, "learning_rate": 2.5971670393903914e-08, "loss": 1.2688, "step": 35802 }, { "epoch": 0.98, "learning_rate": 2.5908002851948723e-08, "loss": 1.1383, "step": 35803 }, { "epoch": 0.98, "learning_rate": 2.5844413342600573e-08, "loss": 1.3142, "step": 35804 }, { "epoch": 0.98, "learning_rate": 2.5780901866353513e-08, "loss": 1.3281, "step": 35805 }, { "epoch": 0.98, "learning_rate": 2.571746842370826e-08, "loss": 1.0913, "step": 35806 }, { "epoch": 0.98, "learning_rate": 2.5654113015158855e-08, "loss": 1.2092, "step": 35807 }, { "epoch": 0.98, "learning_rate": 2.559083564120046e-08, "loss": 1.1121, "step": 35808 }, { "epoch": 0.98, "learning_rate": 2.552763630232935e-08, "loss": 1.2563, "step": 35809 }, { "epoch": 0.98, "learning_rate": 2.546451499904068e-08, "loss": 1.3481, "step": 35810 }, { "epoch": 0.98, "learning_rate": 2.540147173182739e-08, "loss": 1.2332, "step": 35811 }, { "epoch": 0.98, "learning_rate": 2.5338506501181303e-08, "loss": 1.2317, "step": 35812 }, { "epoch": 0.98, "learning_rate": 2.5275619307596476e-08, "loss": 1.127, "step": 35813 }, { "epoch": 0.98, "learning_rate": 2.5212810151565847e-08, "loss": 1.3689, "step": 35814 }, { "epoch": 0.98, "learning_rate": 2.5150079033579022e-08, "loss": 1.3088, "step": 35815 }, { "epoch": 0.98, "learning_rate": 2.508742595412783e-08, "loss": 1.0608, "step": 35816 }, { "epoch": 0.98, "learning_rate": 2.502485091370188e-08, "loss": 1.3823, "step": 35817 }, { "epoch": 0.98, "learning_rate": 2.496235391279078e-08, "loss": 1.3811, "step": 35818 }, { "epoch": 0.98, "learning_rate": 2.489993495188303e-08, "loss": 1.2175, "step": 35819 }, { "epoch": 0.98, "learning_rate": 2.4837594031468237e-08, "loss": 1.2178, "step": 35820 }, { "epoch": 0.98, "learning_rate": 2.477533115203379e-08, "loss": 1.2725, "step": 35821 }, { "epoch": 0.98, "learning_rate": 2.471314631406596e-08, "loss": 1.3521, "step": 35822 }, { "epoch": 0.98, "learning_rate": 2.4651039518052146e-08, "loss": 1.2373, "step": 35823 }, { "epoch": 0.98, "learning_rate": 2.4589010764477506e-08, "loss": 1.6519, "step": 35824 }, { "epoch": 0.98, "learning_rate": 2.4527060053828323e-08, "loss": 1.262, "step": 35825 }, { "epoch": 0.98, "learning_rate": 2.4465187386587542e-08, "loss": 1.2126, "step": 35826 }, { "epoch": 0.98, "learning_rate": 2.440339276324144e-08, "loss": 1.2834, "step": 35827 }, { "epoch": 0.98, "learning_rate": 2.4341676184271855e-08, "loss": 1.4055, "step": 35828 }, { "epoch": 0.98, "learning_rate": 2.4280037650161736e-08, "loss": 1.3169, "step": 35829 }, { "epoch": 0.98, "learning_rate": 2.4218477161394027e-08, "loss": 1.3193, "step": 35830 }, { "epoch": 0.98, "learning_rate": 2.4156994718449455e-08, "loss": 1.1572, "step": 35831 }, { "epoch": 0.98, "learning_rate": 2.409559032181097e-08, "loss": 1.2527, "step": 35832 }, { "epoch": 0.98, "learning_rate": 2.4034263971955963e-08, "loss": 1.2986, "step": 35833 }, { "epoch": 0.98, "learning_rate": 2.3973015669367383e-08, "loss": 1.2727, "step": 35834 }, { "epoch": 0.98, "learning_rate": 2.3911845414521516e-08, "loss": 1.2305, "step": 35835 }, { "epoch": 0.98, "learning_rate": 2.3850753207899092e-08, "loss": 1.1807, "step": 35836 }, { "epoch": 0.98, "learning_rate": 2.378973904997639e-08, "loss": 1.3926, "step": 35837 }, { "epoch": 0.98, "learning_rate": 2.372880294123303e-08, "loss": 1.1804, "step": 35838 }, { "epoch": 0.98, "learning_rate": 2.3667944882143078e-08, "loss": 1.272, "step": 35839 }, { "epoch": 0.98, "learning_rate": 2.360716487318504e-08, "loss": 1.2271, "step": 35840 }, { "epoch": 0.98, "learning_rate": 2.354646291483187e-08, "loss": 1.2393, "step": 35841 }, { "epoch": 0.98, "learning_rate": 2.348583900756096e-08, "loss": 1.2747, "step": 35842 }, { "epoch": 0.98, "learning_rate": 2.3425293151845274e-08, "loss": 1.2952, "step": 35843 }, { "epoch": 0.98, "learning_rate": 2.336482534815887e-08, "loss": 1.1732, "step": 35844 }, { "epoch": 0.98, "learning_rate": 2.3304435596974707e-08, "loss": 1.1169, "step": 35845 }, { "epoch": 0.98, "learning_rate": 2.3244123898765735e-08, "loss": 1.3721, "step": 35846 }, { "epoch": 0.98, "learning_rate": 2.3183890254002694e-08, "loss": 1.2749, "step": 35847 }, { "epoch": 0.98, "learning_rate": 2.3123734663157427e-08, "loss": 1.1875, "step": 35848 }, { "epoch": 0.98, "learning_rate": 2.3063657126701776e-08, "loss": 1.197, "step": 35849 }, { "epoch": 0.98, "learning_rate": 2.300365764510315e-08, "loss": 1.23, "step": 35850 }, { "epoch": 0.98, "learning_rate": 2.294373621883339e-08, "loss": 1.2146, "step": 35851 }, { "epoch": 0.98, "learning_rate": 2.2883892848358792e-08, "loss": 1.3838, "step": 35852 }, { "epoch": 0.98, "learning_rate": 2.2824127534150088e-08, "loss": 1.3184, "step": 35853 }, { "epoch": 0.98, "learning_rate": 2.2764440276674682e-08, "loss": 1.2344, "step": 35854 }, { "epoch": 0.98, "learning_rate": 2.270483107639776e-08, "loss": 1.3494, "step": 35855 }, { "epoch": 0.98, "learning_rate": 2.2645299933785613e-08, "loss": 1.1899, "step": 35856 }, { "epoch": 0.98, "learning_rate": 2.258584684930676e-08, "loss": 1.0693, "step": 35857 }, { "epoch": 0.98, "learning_rate": 2.2526471823423046e-08, "loss": 1.2136, "step": 35858 }, { "epoch": 0.98, "learning_rate": 2.246717485660188e-08, "loss": 1.4041, "step": 35859 }, { "epoch": 0.98, "learning_rate": 2.2407955949305115e-08, "loss": 1.1587, "step": 35860 }, { "epoch": 0.98, "learning_rate": 2.2348815101995715e-08, "loss": 1.2854, "step": 35861 }, { "epoch": 0.98, "learning_rate": 2.2289752315138856e-08, "loss": 1.3284, "step": 35862 }, { "epoch": 0.98, "learning_rate": 2.223076758919418e-08, "loss": 1.2632, "step": 35863 }, { "epoch": 0.98, "learning_rate": 2.2171860924624643e-08, "loss": 1.4241, "step": 35864 }, { "epoch": 0.98, "learning_rate": 2.2113032321889882e-08, "loss": 1.208, "step": 35865 }, { "epoch": 0.98, "learning_rate": 2.2054281781451746e-08, "loss": 1.1683, "step": 35866 }, { "epoch": 0.98, "learning_rate": 2.199560930376876e-08, "loss": 1.2637, "step": 35867 }, { "epoch": 0.98, "learning_rate": 2.1937014889299446e-08, "loss": 1.2944, "step": 35868 }, { "epoch": 0.98, "learning_rate": 2.1878498538503435e-08, "loss": 1.2749, "step": 35869 }, { "epoch": 0.98, "learning_rate": 2.1820060251838137e-08, "loss": 1.1506, "step": 35870 }, { "epoch": 0.98, "learning_rate": 2.176170002976097e-08, "loss": 1.1892, "step": 35871 }, { "epoch": 0.98, "learning_rate": 2.1703417872727116e-08, "loss": 1.2776, "step": 35872 }, { "epoch": 0.98, "learning_rate": 2.1645213781193997e-08, "loss": 1.3936, "step": 35873 }, { "epoch": 0.98, "learning_rate": 2.15870877556168e-08, "loss": 1.2502, "step": 35874 }, { "epoch": 0.98, "learning_rate": 2.1529039796449602e-08, "loss": 1.6987, "step": 35875 }, { "epoch": 0.98, "learning_rate": 2.14710699041476e-08, "loss": 1.3418, "step": 35876 }, { "epoch": 0.98, "learning_rate": 2.1413178079163767e-08, "loss": 1.3103, "step": 35877 }, { "epoch": 0.98, "learning_rate": 2.1355364321949956e-08, "loss": 1.627, "step": 35878 }, { "epoch": 0.98, "learning_rate": 2.1297628632960253e-08, "loss": 1.2837, "step": 35879 }, { "epoch": 0.98, "learning_rate": 2.1239971012645412e-08, "loss": 1.2866, "step": 35880 }, { "epoch": 0.98, "learning_rate": 2.1182391461457286e-08, "loss": 1.3257, "step": 35881 }, { "epoch": 0.98, "learning_rate": 2.112488997984552e-08, "loss": 1.1841, "step": 35882 }, { "epoch": 0.98, "learning_rate": 2.1067466568259752e-08, "loss": 1.2546, "step": 35883 }, { "epoch": 0.98, "learning_rate": 2.1010121227149626e-08, "loss": 1.2041, "step": 35884 }, { "epoch": 0.98, "learning_rate": 2.095285395696367e-08, "loss": 1.3792, "step": 35885 }, { "epoch": 0.98, "learning_rate": 2.0895664758151523e-08, "loss": 1.3967, "step": 35886 }, { "epoch": 0.98, "learning_rate": 2.0838553631157275e-08, "loss": 1.1433, "step": 35887 }, { "epoch": 0.98, "learning_rate": 2.078152057643057e-08, "loss": 1.1099, "step": 35888 }, { "epoch": 0.98, "learning_rate": 2.072456559441771e-08, "loss": 1.2031, "step": 35889 }, { "epoch": 0.98, "learning_rate": 2.0667688685561683e-08, "loss": 1.4192, "step": 35890 }, { "epoch": 0.98, "learning_rate": 2.0610889850309902e-08, "loss": 1.3232, "step": 35891 }, { "epoch": 0.98, "learning_rate": 2.0554169089105346e-08, "loss": 1.1941, "step": 35892 }, { "epoch": 0.98, "learning_rate": 2.049752640239322e-08, "loss": 1.2964, "step": 35893 }, { "epoch": 0.98, "learning_rate": 2.0440961790614278e-08, "loss": 1.167, "step": 35894 }, { "epoch": 0.98, "learning_rate": 2.038447525421372e-08, "loss": 1.2556, "step": 35895 }, { "epoch": 0.98, "learning_rate": 2.0328066793632307e-08, "loss": 1.2297, "step": 35896 }, { "epoch": 0.98, "learning_rate": 2.0271736409310794e-08, "loss": 1.2495, "step": 35897 }, { "epoch": 0.98, "learning_rate": 2.0215484101689943e-08, "loss": 1.3218, "step": 35898 }, { "epoch": 0.98, "learning_rate": 2.015930987121162e-08, "loss": 1.2759, "step": 35899 }, { "epoch": 0.98, "learning_rate": 2.010321371831325e-08, "loss": 1.2751, "step": 35900 }, { "epoch": 0.98, "learning_rate": 2.0047195643434493e-08, "loss": 1.1843, "step": 35901 }, { "epoch": 0.98, "learning_rate": 1.9991255647013874e-08, "loss": 1.1772, "step": 35902 }, { "epoch": 0.98, "learning_rate": 1.9935393729487716e-08, "loss": 1.2444, "step": 35903 }, { "epoch": 0.98, "learning_rate": 1.987960989129456e-08, "loss": 1.3018, "step": 35904 }, { "epoch": 0.98, "learning_rate": 1.982390413287183e-08, "loss": 1.2251, "step": 35905 }, { "epoch": 0.98, "learning_rate": 1.9768276454652512e-08, "loss": 1.8188, "step": 35906 }, { "epoch": 0.98, "learning_rate": 1.971272685707293e-08, "loss": 1.2649, "step": 35907 }, { "epoch": 0.98, "learning_rate": 1.965725534056828e-08, "loss": 1.77, "step": 35908 }, { "epoch": 0.98, "learning_rate": 1.9601861905572673e-08, "loss": 1.3284, "step": 35909 }, { "epoch": 0.98, "learning_rate": 1.9546546552517974e-08, "loss": 1.6919, "step": 35910 }, { "epoch": 0.98, "learning_rate": 1.949130928183829e-08, "loss": 1.314, "step": 35911 }, { "epoch": 0.98, "learning_rate": 1.943615009396549e-08, "loss": 1.3005, "step": 35912 }, { "epoch": 0.98, "learning_rate": 1.9381068989332562e-08, "loss": 1.3098, "step": 35913 }, { "epoch": 0.98, "learning_rate": 1.9326065968366947e-08, "loss": 1.2454, "step": 35914 }, { "epoch": 0.98, "learning_rate": 1.9271141031501628e-08, "loss": 1.2913, "step": 35915 }, { "epoch": 0.98, "learning_rate": 1.9216294179165153e-08, "loss": 1.1763, "step": 35916 }, { "epoch": 0.98, "learning_rate": 1.9161525411788284e-08, "loss": 1.2175, "step": 35917 }, { "epoch": 0.98, "learning_rate": 1.910683472979735e-08, "loss": 1.2102, "step": 35918 }, { "epoch": 0.98, "learning_rate": 1.905222213362201e-08, "loss": 1.1589, "step": 35919 }, { "epoch": 0.98, "learning_rate": 1.8997687623687477e-08, "loss": 1.1921, "step": 35920 }, { "epoch": 0.98, "learning_rate": 1.8943231200422296e-08, "loss": 1.2148, "step": 35921 }, { "epoch": 0.98, "learning_rate": 1.8888852864251685e-08, "loss": 1.0985, "step": 35922 }, { "epoch": 0.98, "learning_rate": 1.8834552615601966e-08, "loss": 1.2563, "step": 35923 }, { "epoch": 0.98, "learning_rate": 1.8780330454896135e-08, "loss": 1.1519, "step": 35924 }, { "epoch": 0.98, "learning_rate": 1.872618638256052e-08, "loss": 1.1384, "step": 35925 }, { "epoch": 0.98, "learning_rate": 1.8672120399017e-08, "loss": 1.2605, "step": 35926 }, { "epoch": 0.98, "learning_rate": 1.861813250468969e-08, "loss": 1.2698, "step": 35927 }, { "epoch": 0.98, "learning_rate": 1.8564222700000466e-08, "loss": 1.7495, "step": 35928 }, { "epoch": 0.98, "learning_rate": 1.851039098537122e-08, "loss": 1.2192, "step": 35929 }, { "epoch": 0.98, "learning_rate": 1.8456637361222717e-08, "loss": 1.2292, "step": 35930 }, { "epoch": 0.98, "learning_rate": 1.8402961827975742e-08, "loss": 1.0667, "step": 35931 }, { "epoch": 0.98, "learning_rate": 1.834936438604995e-08, "loss": 1.1392, "step": 35932 }, { "epoch": 0.98, "learning_rate": 1.8295845035866122e-08, "loss": 1.2458, "step": 35933 }, { "epoch": 0.98, "learning_rate": 1.82424037778417e-08, "loss": 1.3955, "step": 35934 }, { "epoch": 0.98, "learning_rate": 1.8189040612394128e-08, "loss": 1.3813, "step": 35935 }, { "epoch": 0.98, "learning_rate": 1.813575553994196e-08, "loss": 1.2524, "step": 35936 }, { "epoch": 0.98, "learning_rate": 1.8082548560902636e-08, "loss": 1.2814, "step": 35937 }, { "epoch": 0.98, "learning_rate": 1.8029419675691384e-08, "loss": 1.2866, "step": 35938 }, { "epoch": 0.98, "learning_rate": 1.797636888472343e-08, "loss": 1.1606, "step": 35939 }, { "epoch": 0.98, "learning_rate": 1.79233961884151e-08, "loss": 1.135, "step": 35940 }, { "epoch": 0.98, "learning_rate": 1.78705015871794e-08, "loss": 1.1521, "step": 35941 }, { "epoch": 0.98, "learning_rate": 1.7817685081431557e-08, "loss": 1.2888, "step": 35942 }, { "epoch": 0.98, "learning_rate": 1.776494667158457e-08, "loss": 1.324, "step": 35943 }, { "epoch": 0.98, "learning_rate": 1.7712286358050335e-08, "loss": 1.4097, "step": 35944 }, { "epoch": 0.98, "learning_rate": 1.765970414124074e-08, "loss": 1.3291, "step": 35945 }, { "epoch": 0.98, "learning_rate": 1.7607200021567683e-08, "loss": 1.2683, "step": 35946 }, { "epoch": 0.98, "learning_rate": 1.7554773999443054e-08, "loss": 1.293, "step": 35947 }, { "epoch": 0.98, "learning_rate": 1.7502426075274303e-08, "loss": 1.3132, "step": 35948 }, { "epoch": 0.98, "learning_rate": 1.7450156249473326e-08, "loss": 1.3157, "step": 35949 }, { "epoch": 0.98, "learning_rate": 1.7397964522447576e-08, "loss": 1.2017, "step": 35950 }, { "epoch": 0.98, "learning_rate": 1.734585089460672e-08, "loss": 1.2979, "step": 35951 }, { "epoch": 0.98, "learning_rate": 1.7293815366357102e-08, "loss": 1.2439, "step": 35952 }, { "epoch": 0.98, "learning_rate": 1.7241857938107287e-08, "loss": 1.2456, "step": 35953 }, { "epoch": 0.98, "learning_rate": 1.7189978610262502e-08, "loss": 1.1477, "step": 35954 }, { "epoch": 0.98, "learning_rate": 1.713817738322798e-08, "loss": 1.0659, "step": 35955 }, { "epoch": 0.98, "learning_rate": 1.7086454257412288e-08, "loss": 1.176, "step": 35956 }, { "epoch": 0.98, "learning_rate": 1.703480923321621e-08, "loss": 1.0439, "step": 35957 }, { "epoch": 0.98, "learning_rate": 1.6983242311046087e-08, "loss": 1.2183, "step": 35958 }, { "epoch": 0.98, "learning_rate": 1.6931753491303825e-08, "loss": 1.2512, "step": 35959 }, { "epoch": 0.98, "learning_rate": 1.6880342774394654e-08, "loss": 1.3325, "step": 35960 }, { "epoch": 0.98, "learning_rate": 1.682901016071825e-08, "loss": 1.105, "step": 35961 }, { "epoch": 0.98, "learning_rate": 1.677775565067763e-08, "loss": 1.3162, "step": 35962 }, { "epoch": 0.98, "learning_rate": 1.672657924467358e-08, "loss": 1.2771, "step": 35963 }, { "epoch": 0.98, "learning_rate": 1.6675480943105783e-08, "loss": 1.2346, "step": 35964 }, { "epoch": 0.98, "learning_rate": 1.6624460746375028e-08, "loss": 1.2292, "step": 35965 }, { "epoch": 0.98, "learning_rate": 1.6573518654879882e-08, "loss": 1.3232, "step": 35966 }, { "epoch": 0.98, "learning_rate": 1.6522654669018922e-08, "loss": 1.1235, "step": 35967 }, { "epoch": 0.98, "learning_rate": 1.6471868789189604e-08, "loss": 1.3687, "step": 35968 }, { "epoch": 0.98, "learning_rate": 1.6421161015790498e-08, "loss": 1.2703, "step": 35969 }, { "epoch": 0.98, "learning_rate": 1.6370531349216845e-08, "loss": 1.0435, "step": 35970 }, { "epoch": 0.98, "learning_rate": 1.63199797898661e-08, "loss": 1.3608, "step": 35971 }, { "epoch": 0.98, "learning_rate": 1.6269506338133512e-08, "loss": 1.2739, "step": 35972 }, { "epoch": 0.98, "learning_rate": 1.6219110994413202e-08, "loss": 1.2168, "step": 35973 }, { "epoch": 0.98, "learning_rate": 1.616879375910041e-08, "loss": 1.2576, "step": 35974 }, { "epoch": 0.98, "learning_rate": 1.6118554632587045e-08, "loss": 1.2478, "step": 35975 }, { "epoch": 0.98, "learning_rate": 1.6068393615268353e-08, "loss": 1.2783, "step": 35976 }, { "epoch": 0.98, "learning_rate": 1.6018310707536234e-08, "loss": 1.3564, "step": 35977 }, { "epoch": 0.98, "learning_rate": 1.596830590978038e-08, "loss": 1.2224, "step": 35978 }, { "epoch": 0.98, "learning_rate": 1.5918379222394918e-08, "loss": 1.1729, "step": 35979 }, { "epoch": 0.98, "learning_rate": 1.5868530645769542e-08, "loss": 1.2954, "step": 35980 }, { "epoch": 0.98, "learning_rate": 1.5818760180292826e-08, "loss": 1.3347, "step": 35981 }, { "epoch": 0.98, "learning_rate": 1.5769067826355565e-08, "loss": 1.2773, "step": 35982 }, { "epoch": 0.98, "learning_rate": 1.5719453584346344e-08, "loss": 1.2759, "step": 35983 }, { "epoch": 0.98, "learning_rate": 1.566991745465374e-08, "loss": 1.3022, "step": 35984 }, { "epoch": 0.98, "learning_rate": 1.5620459437664105e-08, "loss": 1.3618, "step": 35985 }, { "epoch": 0.98, "learning_rate": 1.557107953376491e-08, "loss": 1.248, "step": 35986 }, { "epoch": 0.98, "learning_rate": 1.5521777743342516e-08, "loss": 1.1981, "step": 35987 }, { "epoch": 0.98, "learning_rate": 1.5472554066783273e-08, "loss": 1.3474, "step": 35988 }, { "epoch": 0.98, "learning_rate": 1.5423408504471326e-08, "loss": 1.1875, "step": 35989 }, { "epoch": 0.98, "learning_rate": 1.537434105679192e-08, "loss": 1.209, "step": 35990 }, { "epoch": 0.98, "learning_rate": 1.532535172412808e-08, "loss": 1.3579, "step": 35991 }, { "epoch": 0.98, "learning_rate": 1.5276440506863942e-08, "loss": 1.165, "step": 35992 }, { "epoch": 0.98, "learning_rate": 1.5227607405381428e-08, "loss": 1.1968, "step": 35993 }, { "epoch": 0.98, "learning_rate": 1.517885242006245e-08, "loss": 1.3091, "step": 35994 }, { "epoch": 0.98, "learning_rate": 1.5130175551290037e-08, "loss": 1.1116, "step": 35995 }, { "epoch": 0.98, "learning_rate": 1.5081576799443886e-08, "loss": 1.3442, "step": 35996 }, { "epoch": 0.98, "learning_rate": 1.503305616490369e-08, "loss": 1.1731, "step": 35997 }, { "epoch": 0.98, "learning_rate": 1.4984613648049152e-08, "loss": 1.2949, "step": 35998 }, { "epoch": 0.98, "learning_rate": 1.493624924926107e-08, "loss": 1.3201, "step": 35999 }, { "epoch": 0.98, "learning_rate": 1.4887962968914704e-08, "loss": 1.1506, "step": 36000 }, { "epoch": 0.98, "learning_rate": 1.4839754807390861e-08, "loss": 1.3074, "step": 36001 }, { "epoch": 0.98, "learning_rate": 1.4791624765064793e-08, "loss": 1.2292, "step": 36002 }, { "epoch": 0.98, "learning_rate": 1.474357284231509e-08, "loss": 1.1318, "step": 36003 }, { "epoch": 0.98, "learning_rate": 1.4695599039514784e-08, "loss": 1.2124, "step": 36004 }, { "epoch": 0.98, "learning_rate": 1.4647703357041354e-08, "loss": 1.2209, "step": 36005 }, { "epoch": 0.98, "learning_rate": 1.4599885795267832e-08, "loss": 1.1665, "step": 36006 }, { "epoch": 0.98, "learning_rate": 1.4552146354570585e-08, "loss": 1.3574, "step": 36007 }, { "epoch": 0.98, "learning_rate": 1.4504485035321536e-08, "loss": 1.3191, "step": 36008 }, { "epoch": 0.98, "learning_rate": 1.4456901837893721e-08, "loss": 1.3306, "step": 36009 }, { "epoch": 0.98, "learning_rate": 1.4409396762659066e-08, "loss": 1.3123, "step": 36010 }, { "epoch": 0.98, "learning_rate": 1.4361969809990607e-08, "loss": 1.2502, "step": 36011 }, { "epoch": 0.98, "learning_rate": 1.4314620980258042e-08, "loss": 1.1919, "step": 36012 }, { "epoch": 0.98, "learning_rate": 1.4267350273832193e-08, "loss": 1.3843, "step": 36013 }, { "epoch": 0.98, "learning_rate": 1.422015769108387e-08, "loss": 1.3044, "step": 36014 }, { "epoch": 0.98, "learning_rate": 1.4173043232380557e-08, "loss": 1.1091, "step": 36015 }, { "epoch": 0.98, "learning_rate": 1.412600689809196e-08, "loss": 1.1244, "step": 36016 }, { "epoch": 0.98, "learning_rate": 1.4079048688585562e-08, "loss": 1.3147, "step": 36017 }, { "epoch": 0.98, "learning_rate": 1.4032168604228847e-08, "loss": 1.2808, "step": 36018 }, { "epoch": 0.98, "learning_rate": 1.3985366645389298e-08, "loss": 1.1831, "step": 36019 }, { "epoch": 0.98, "learning_rate": 1.3938642812432179e-08, "loss": 1.2334, "step": 36020 }, { "epoch": 0.98, "learning_rate": 1.3891997105722755e-08, "loss": 1.1592, "step": 36021 }, { "epoch": 0.98, "learning_rate": 1.3845429525627396e-08, "loss": 1.283, "step": 36022 }, { "epoch": 0.98, "learning_rate": 1.3798940072509148e-08, "loss": 1.2124, "step": 36023 }, { "epoch": 0.98, "learning_rate": 1.3752528746733274e-08, "loss": 1.2595, "step": 36024 }, { "epoch": 0.98, "learning_rate": 1.3706195548660595e-08, "loss": 1.3838, "step": 36025 }, { "epoch": 0.98, "learning_rate": 1.3659940478654155e-08, "loss": 1.2562, "step": 36026 }, { "epoch": 0.98, "learning_rate": 1.3613763537078106e-08, "loss": 1.271, "step": 36027 }, { "epoch": 0.98, "learning_rate": 1.3567664724289942e-08, "loss": 1.1504, "step": 36028 }, { "epoch": 0.98, "learning_rate": 1.3521644040653814e-08, "loss": 1.2805, "step": 36029 }, { "epoch": 0.98, "learning_rate": 1.3475701486528325e-08, "loss": 1.354, "step": 36030 }, { "epoch": 0.98, "learning_rate": 1.3429837062273188e-08, "loss": 1.3682, "step": 36031 }, { "epoch": 0.98, "learning_rate": 1.3384050768247004e-08, "loss": 1.2297, "step": 36032 }, { "epoch": 0.98, "learning_rate": 1.3338342604807264e-08, "loss": 1.283, "step": 36033 }, { "epoch": 0.98, "learning_rate": 1.3292712572312572e-08, "loss": 1.2656, "step": 36034 }, { "epoch": 0.98, "learning_rate": 1.3247160671119308e-08, "loss": 1.1648, "step": 36035 }, { "epoch": 0.98, "learning_rate": 1.3201686901584965e-08, "loss": 1.2886, "step": 36036 }, { "epoch": 0.98, "learning_rate": 1.3156291264063703e-08, "loss": 1.3611, "step": 36037 }, { "epoch": 0.98, "learning_rate": 1.3110973758911905e-08, "loss": 1.2754, "step": 36038 }, { "epoch": 0.98, "learning_rate": 1.306573438648373e-08, "loss": 1.6182, "step": 36039 }, { "epoch": 0.98, "learning_rate": 1.3020573147132231e-08, "loss": 1.2957, "step": 36040 }, { "epoch": 0.98, "learning_rate": 1.2975490041212679e-08, "loss": 1.2021, "step": 36041 }, { "epoch": 0.98, "learning_rate": 1.2930485069075904e-08, "loss": 1.2532, "step": 36042 }, { "epoch": 0.98, "learning_rate": 1.2885558231076067e-08, "loss": 1.1909, "step": 36043 }, { "epoch": 0.98, "learning_rate": 1.284070952756178e-08, "loss": 1.2747, "step": 36044 }, { "epoch": 0.98, "learning_rate": 1.2795938958886089e-08, "loss": 1.2532, "step": 36045 }, { "epoch": 0.98, "learning_rate": 1.275124652539872e-08, "loss": 1.1438, "step": 36046 }, { "epoch": 0.98, "learning_rate": 1.270663222744939e-08, "loss": 1.21, "step": 36047 }, { "epoch": 0.98, "learning_rate": 1.2662096065386709e-08, "loss": 1.1765, "step": 36048 }, { "epoch": 0.98, "learning_rate": 1.2617638039559287e-08, "loss": 1.6082, "step": 36049 }, { "epoch": 0.98, "learning_rate": 1.2573258150315736e-08, "loss": 1.3225, "step": 36050 }, { "epoch": 0.98, "learning_rate": 1.2528956398001335e-08, "loss": 1.1702, "step": 36051 }, { "epoch": 0.98, "learning_rate": 1.2484732782964693e-08, "loss": 1.2764, "step": 36052 }, { "epoch": 0.98, "learning_rate": 1.2440587305551088e-08, "loss": 1.2539, "step": 36053 }, { "epoch": 0.98, "learning_rate": 1.2396519966105802e-08, "loss": 1.2957, "step": 36054 }, { "epoch": 0.98, "learning_rate": 1.2352530764974113e-08, "loss": 1.1746, "step": 36055 }, { "epoch": 0.98, "learning_rate": 1.230861970249908e-08, "loss": 1.2012, "step": 36056 }, { "epoch": 0.98, "learning_rate": 1.2264786779024873e-08, "loss": 1.2001, "step": 36057 }, { "epoch": 0.98, "learning_rate": 1.222103199489455e-08, "loss": 1.262, "step": 36058 }, { "epoch": 0.98, "learning_rate": 1.217735535045117e-08, "loss": 1.3257, "step": 36059 }, { "epoch": 0.98, "learning_rate": 1.213375684603446e-08, "loss": 1.2185, "step": 36060 }, { "epoch": 0.98, "learning_rate": 1.2090236481986372e-08, "loss": 1.1227, "step": 36061 }, { "epoch": 0.98, "learning_rate": 1.2046794258648853e-08, "loss": 1.2522, "step": 36062 }, { "epoch": 0.98, "learning_rate": 1.200343017635941e-08, "loss": 1.3513, "step": 36063 }, { "epoch": 0.98, "learning_rate": 1.1960144235458881e-08, "loss": 1.2795, "step": 36064 }, { "epoch": 0.98, "learning_rate": 1.1916936436285887e-08, "loss": 1.2354, "step": 36065 }, { "epoch": 0.98, "learning_rate": 1.1873806779176822e-08, "loss": 1.3115, "step": 36066 }, { "epoch": 0.98, "learning_rate": 1.1830755264471416e-08, "loss": 1.2244, "step": 36067 }, { "epoch": 0.98, "learning_rate": 1.1787781892504957e-08, "loss": 1.2644, "step": 36068 }, { "epoch": 0.99, "learning_rate": 1.1744886663614951e-08, "loss": 1.3062, "step": 36069 }, { "epoch": 0.99, "learning_rate": 1.1702069578135577e-08, "loss": 1.3652, "step": 36070 }, { "epoch": 0.99, "learning_rate": 1.1659330636402123e-08, "loss": 1.3169, "step": 36071 }, { "epoch": 0.99, "learning_rate": 1.1616669838748763e-08, "loss": 1.1848, "step": 36072 }, { "epoch": 0.99, "learning_rate": 1.1574087185510785e-08, "loss": 1.3513, "step": 36073 }, { "epoch": 0.99, "learning_rate": 1.1531582677020148e-08, "loss": 1.3186, "step": 36074 }, { "epoch": 0.99, "learning_rate": 1.1489156313608807e-08, "loss": 1.3608, "step": 36075 }, { "epoch": 0.99, "learning_rate": 1.144680809560983e-08, "loss": 1.416, "step": 36076 }, { "epoch": 0.99, "learning_rate": 1.1404538023354062e-08, "loss": 1.6348, "step": 36077 }, { "epoch": 0.99, "learning_rate": 1.136234609717235e-08, "loss": 1.1567, "step": 36078 }, { "epoch": 0.99, "learning_rate": 1.1320232317394431e-08, "loss": 1.2756, "step": 36079 }, { "epoch": 0.99, "learning_rate": 1.127819668435004e-08, "loss": 1.2844, "step": 36080 }, { "epoch": 0.99, "learning_rate": 1.1236239198367805e-08, "loss": 1.1919, "step": 36081 }, { "epoch": 0.99, "learning_rate": 1.1194359859776349e-08, "loss": 1.2498, "step": 36082 }, { "epoch": 0.99, "learning_rate": 1.1152558668903191e-08, "loss": 1.4124, "step": 36083 }, { "epoch": 0.99, "learning_rate": 1.1110835626075845e-08, "loss": 1.2327, "step": 36084 }, { "epoch": 0.99, "learning_rate": 1.1069190731619605e-08, "loss": 1.3179, "step": 36085 }, { "epoch": 0.99, "learning_rate": 1.102762398586088e-08, "loss": 1.2668, "step": 36086 }, { "epoch": 0.99, "learning_rate": 1.0986135389124964e-08, "loss": 1.1306, "step": 36087 }, { "epoch": 0.99, "learning_rate": 1.094472494173604e-08, "loss": 1.2542, "step": 36088 }, { "epoch": 0.99, "learning_rate": 1.0903392644018295e-08, "loss": 1.2483, "step": 36089 }, { "epoch": 0.99, "learning_rate": 1.0862138496295916e-08, "loss": 1.2004, "step": 36090 }, { "epoch": 0.99, "learning_rate": 1.0820962498890863e-08, "loss": 1.1809, "step": 36091 }, { "epoch": 0.99, "learning_rate": 1.0779864652125105e-08, "loss": 1.26, "step": 36092 }, { "epoch": 0.99, "learning_rate": 1.0738844956320605e-08, "loss": 1.2939, "step": 36093 }, { "epoch": 0.99, "learning_rate": 1.0697903411798216e-08, "loss": 1.282, "step": 36094 }, { "epoch": 0.99, "learning_rate": 1.0657040018877685e-08, "loss": 1.3125, "step": 36095 }, { "epoch": 0.99, "learning_rate": 1.0616254777879864e-08, "loss": 1.1816, "step": 36096 }, { "epoch": 0.99, "learning_rate": 1.0575547689122278e-08, "loss": 1.1736, "step": 36097 }, { "epoch": 0.99, "learning_rate": 1.0534918752924672e-08, "loss": 1.2834, "step": 36098 }, { "epoch": 0.99, "learning_rate": 1.0494367969604568e-08, "loss": 1.177, "step": 36099 }, { "epoch": 0.99, "learning_rate": 1.0453895339478381e-08, "loss": 1.4509, "step": 36100 }, { "epoch": 0.99, "learning_rate": 1.0413500862864745e-08, "loss": 1.2373, "step": 36101 }, { "epoch": 0.99, "learning_rate": 1.0373184540077852e-08, "loss": 1.085, "step": 36102 }, { "epoch": 0.99, "learning_rate": 1.0332946371433007e-08, "loss": 1.4121, "step": 36103 }, { "epoch": 0.99, "learning_rate": 1.029278635724662e-08, "loss": 1.2756, "step": 36104 }, { "epoch": 0.99, "learning_rate": 1.0252704497831779e-08, "loss": 1.2954, "step": 36105 }, { "epoch": 0.99, "learning_rate": 1.0212700793502672e-08, "loss": 1.2527, "step": 36106 }, { "epoch": 0.99, "learning_rate": 1.0172775244571276e-08, "loss": 1.2549, "step": 36107 }, { "epoch": 0.99, "learning_rate": 1.0132927851350672e-08, "loss": 1.1204, "step": 36108 }, { "epoch": 0.99, "learning_rate": 1.0093158614152831e-08, "loss": 1.2463, "step": 36109 }, { "epoch": 0.99, "learning_rate": 1.0053467533287509e-08, "loss": 1.2815, "step": 36110 }, { "epoch": 0.99, "learning_rate": 1.0013854609066675e-08, "loss": 1.3909, "step": 36111 }, { "epoch": 0.99, "learning_rate": 9.974319841800085e-09, "loss": 1.2368, "step": 36112 }, { "epoch": 0.99, "learning_rate": 9.934863231797487e-09, "loss": 1.3188, "step": 36113 }, { "epoch": 0.99, "learning_rate": 9.895484779366416e-09, "loss": 1.4351, "step": 36114 }, { "epoch": 0.99, "learning_rate": 9.856184484814402e-09, "loss": 1.3162, "step": 36115 }, { "epoch": 0.99, "learning_rate": 9.816962348451199e-09, "loss": 1.2664, "step": 36116 }, { "epoch": 0.99, "learning_rate": 9.777818370581005e-09, "loss": 1.3281, "step": 36117 }, { "epoch": 0.99, "learning_rate": 9.738752551512465e-09, "loss": 1.1672, "step": 36118 }, { "epoch": 0.99, "learning_rate": 9.69976489154978e-09, "loss": 1.4272, "step": 36119 }, { "epoch": 0.99, "learning_rate": 9.660855390998258e-09, "loss": 1.228, "step": 36120 }, { "epoch": 0.99, "learning_rate": 9.622024050163215e-09, "loss": 1.3164, "step": 36121 }, { "epoch": 0.99, "learning_rate": 9.583270869346628e-09, "loss": 1.4324, "step": 36122 }, { "epoch": 0.99, "learning_rate": 9.54459584885381e-09, "loss": 1.1353, "step": 36123 }, { "epoch": 0.99, "learning_rate": 9.505998988985632e-09, "loss": 1.2634, "step": 36124 }, { "epoch": 0.99, "learning_rate": 9.467480290044073e-09, "loss": 1.2205, "step": 36125 }, { "epoch": 0.99, "learning_rate": 9.429039752332226e-09, "loss": 1.2825, "step": 36126 }, { "epoch": 0.99, "learning_rate": 9.390677376148738e-09, "loss": 1.2234, "step": 36127 }, { "epoch": 0.99, "learning_rate": 9.352393161794483e-09, "loss": 1.1157, "step": 36128 }, { "epoch": 0.99, "learning_rate": 9.314187109570327e-09, "loss": 1.3025, "step": 36129 }, { "epoch": 0.99, "learning_rate": 9.276059219773814e-09, "loss": 1.2507, "step": 36130 }, { "epoch": 0.99, "learning_rate": 9.238009492702481e-09, "loss": 1.155, "step": 36131 }, { "epoch": 0.99, "learning_rate": 9.200037928654981e-09, "loss": 1.2224, "step": 36132 }, { "epoch": 0.99, "learning_rate": 9.162144527929961e-09, "loss": 0.9895, "step": 36133 }, { "epoch": 0.99, "learning_rate": 9.124329290820522e-09, "loss": 1.3853, "step": 36134 }, { "epoch": 0.99, "learning_rate": 9.086592217625313e-09, "loss": 1.2017, "step": 36135 }, { "epoch": 0.99, "learning_rate": 9.04893330863854e-09, "loss": 1.2764, "step": 36136 }, { "epoch": 0.99, "learning_rate": 9.011352564154418e-09, "loss": 1.3872, "step": 36137 }, { "epoch": 0.99, "learning_rate": 8.973849984467153e-09, "loss": 1.3173, "step": 36138 }, { "epoch": 0.99, "learning_rate": 8.936425569870955e-09, "loss": 1.3003, "step": 36139 }, { "epoch": 0.99, "learning_rate": 8.899079320657811e-09, "loss": 1.3562, "step": 36140 }, { "epoch": 0.99, "learning_rate": 8.861811237119711e-09, "loss": 1.4434, "step": 36141 }, { "epoch": 0.99, "learning_rate": 8.824621319549753e-09, "loss": 1.3596, "step": 36142 }, { "epoch": 0.99, "learning_rate": 8.787509568236597e-09, "loss": 1.7236, "step": 36143 }, { "epoch": 0.99, "learning_rate": 8.750475983472228e-09, "loss": 1.3047, "step": 36144 }, { "epoch": 0.99, "learning_rate": 8.713520565546418e-09, "loss": 1.1929, "step": 36145 }, { "epoch": 0.99, "learning_rate": 8.676643314746714e-09, "loss": 1.2808, "step": 36146 }, { "epoch": 0.99, "learning_rate": 8.639844231363992e-09, "loss": 1.2932, "step": 36147 }, { "epoch": 0.99, "learning_rate": 8.603123315683582e-09, "loss": 1.1887, "step": 36148 }, { "epoch": 0.99, "learning_rate": 8.56648056799525e-09, "loss": 1.2205, "step": 36149 }, { "epoch": 0.99, "learning_rate": 8.529915988583216e-09, "loss": 1.0234, "step": 36150 }, { "epoch": 0.99, "learning_rate": 8.493429577736134e-09, "loss": 1.3296, "step": 36151 }, { "epoch": 0.99, "learning_rate": 8.457021335737115e-09, "loss": 1.2124, "step": 36152 }, { "epoch": 0.99, "learning_rate": 8.420691262872593e-09, "loss": 1.1469, "step": 36153 }, { "epoch": 0.99, "learning_rate": 8.384439359425678e-09, "loss": 1.1548, "step": 36154 }, { "epoch": 0.99, "learning_rate": 8.348265625680585e-09, "loss": 1.2327, "step": 36155 }, { "epoch": 0.99, "learning_rate": 8.312170061920421e-09, "loss": 1.2961, "step": 36156 }, { "epoch": 0.99, "learning_rate": 8.276152668428294e-09, "loss": 1.0842, "step": 36157 }, { "epoch": 0.99, "learning_rate": 8.24021344548398e-09, "loss": 1.2742, "step": 36158 }, { "epoch": 0.99, "learning_rate": 8.204352393369474e-09, "loss": 1.3792, "step": 36159 }, { "epoch": 0.99, "learning_rate": 8.168569512366776e-09, "loss": 1.3098, "step": 36160 }, { "epoch": 0.99, "learning_rate": 8.132864802754547e-09, "loss": 1.3176, "step": 36161 }, { "epoch": 0.99, "learning_rate": 8.097238264811458e-09, "loss": 1.1433, "step": 36162 }, { "epoch": 0.99, "learning_rate": 8.061689898817282e-09, "loss": 1.2986, "step": 36163 }, { "epoch": 0.99, "learning_rate": 8.026219705050686e-09, "loss": 1.2783, "step": 36164 }, { "epoch": 0.99, "learning_rate": 7.990827683787005e-09, "loss": 1.3225, "step": 36165 }, { "epoch": 0.99, "learning_rate": 7.955513835306016e-09, "loss": 1.2756, "step": 36166 }, { "epoch": 0.99, "learning_rate": 7.920278159881944e-09, "loss": 1.1313, "step": 36167 }, { "epoch": 0.99, "learning_rate": 7.885120657790124e-09, "loss": 1.1321, "step": 36168 }, { "epoch": 0.99, "learning_rate": 7.850041329307002e-09, "loss": 1.0718, "step": 36169 }, { "epoch": 0.99, "learning_rate": 7.815040174707911e-09, "loss": 1.1409, "step": 36170 }, { "epoch": 0.99, "learning_rate": 7.780117194263747e-09, "loss": 1.0112, "step": 36171 }, { "epoch": 0.99, "learning_rate": 7.745272388249846e-09, "loss": 1.4307, "step": 36172 }, { "epoch": 0.99, "learning_rate": 7.710505756938213e-09, "loss": 1.46, "step": 36173 }, { "epoch": 0.99, "learning_rate": 7.675817300600852e-09, "loss": 1.345, "step": 36174 }, { "epoch": 0.99, "learning_rate": 7.641207019508656e-09, "loss": 1.2129, "step": 36175 }, { "epoch": 0.99, "learning_rate": 7.606674913933631e-09, "loss": 1.1716, "step": 36176 }, { "epoch": 0.99, "learning_rate": 7.572220984144452e-09, "loss": 1.3274, "step": 36177 }, { "epoch": 0.99, "learning_rate": 7.537845230412011e-09, "loss": 1.436, "step": 36178 }, { "epoch": 0.99, "learning_rate": 7.503547653003873e-09, "loss": 1.5723, "step": 36179 }, { "epoch": 0.99, "learning_rate": 7.469328252190932e-09, "loss": 1.3711, "step": 36180 }, { "epoch": 0.99, "learning_rate": 7.4351870282374225e-09, "loss": 1.271, "step": 36181 }, { "epoch": 0.99, "learning_rate": 7.401123981413128e-09, "loss": 1.2461, "step": 36182 }, { "epoch": 0.99, "learning_rate": 7.36713911198339e-09, "loss": 1.2094, "step": 36183 }, { "epoch": 0.99, "learning_rate": 7.3332324202146645e-09, "loss": 1.2095, "step": 36184 }, { "epoch": 0.99, "learning_rate": 7.299403906371183e-09, "loss": 1.1309, "step": 36185 }, { "epoch": 0.99, "learning_rate": 7.265653570718289e-09, "loss": 1.3142, "step": 36186 }, { "epoch": 0.99, "learning_rate": 7.231981413520217e-09, "loss": 1.1587, "step": 36187 }, { "epoch": 0.99, "learning_rate": 7.198387435040088e-09, "loss": 1.2307, "step": 36188 }, { "epoch": 0.99, "learning_rate": 7.164871635541026e-09, "loss": 1.5479, "step": 36189 }, { "epoch": 0.99, "learning_rate": 7.131434015285043e-09, "loss": 1.7476, "step": 36190 }, { "epoch": 0.99, "learning_rate": 7.098074574533043e-09, "loss": 1.1038, "step": 36191 }, { "epoch": 0.99, "learning_rate": 7.064793313548146e-09, "loss": 1.1338, "step": 36192 }, { "epoch": 0.99, "learning_rate": 7.031590232587926e-09, "loss": 1.3188, "step": 36193 }, { "epoch": 0.99, "learning_rate": 6.998465331914394e-09, "loss": 1.2734, "step": 36194 }, { "epoch": 0.99, "learning_rate": 6.965418611785124e-09, "loss": 1.3945, "step": 36195 }, { "epoch": 0.99, "learning_rate": 6.932450072459907e-09, "loss": 1.2665, "step": 36196 }, { "epoch": 0.99, "learning_rate": 6.8995597141963136e-09, "loss": 1.2485, "step": 36197 }, { "epoch": 0.99, "learning_rate": 6.866747537250806e-09, "loss": 1.21, "step": 36198 }, { "epoch": 0.99, "learning_rate": 6.834013541880957e-09, "loss": 1.1804, "step": 36199 }, { "epoch": 0.99, "learning_rate": 6.801357728343228e-09, "loss": 1.3169, "step": 36200 }, { "epoch": 0.99, "learning_rate": 6.768780096891858e-09, "loss": 1.2952, "step": 36201 }, { "epoch": 0.99, "learning_rate": 6.736280647782201e-09, "loss": 1.2825, "step": 36202 }, { "epoch": 0.99, "learning_rate": 6.703859381269607e-09, "loss": 1.1948, "step": 36203 }, { "epoch": 0.99, "learning_rate": 6.671516297606095e-09, "loss": 1.304, "step": 36204 }, { "epoch": 0.99, "learning_rate": 6.6392513970459096e-09, "loss": 1.2085, "step": 36205 }, { "epoch": 0.99, "learning_rate": 6.607064679841068e-09, "loss": 1.3179, "step": 36206 }, { "epoch": 0.99, "learning_rate": 6.5749561462424835e-09, "loss": 1.3428, "step": 36207 }, { "epoch": 0.99, "learning_rate": 6.542925796503286e-09, "loss": 1.3071, "step": 36208 }, { "epoch": 0.99, "learning_rate": 6.510973630872164e-09, "loss": 1.3018, "step": 36209 }, { "epoch": 0.99, "learning_rate": 6.479099649601139e-09, "loss": 1.1261, "step": 36210 }, { "epoch": 0.99, "learning_rate": 6.447303852936681e-09, "loss": 1.1199, "step": 36211 }, { "epoch": 0.99, "learning_rate": 6.415586241130811e-09, "loss": 1.1279, "step": 36212 }, { "epoch": 0.99, "learning_rate": 6.383946814428888e-09, "loss": 1.3379, "step": 36213 }, { "epoch": 0.99, "learning_rate": 6.352385573079601e-09, "loss": 1.1431, "step": 36214 }, { "epoch": 0.99, "learning_rate": 6.320902517330529e-09, "loss": 1.1726, "step": 36215 }, { "epoch": 0.99, "learning_rate": 6.289497647427034e-09, "loss": 1.2698, "step": 36216 }, { "epoch": 0.99, "learning_rate": 6.258170963615584e-09, "loss": 1.3918, "step": 36217 }, { "epoch": 0.99, "learning_rate": 6.226922466140428e-09, "loss": 1.3125, "step": 36218 }, { "epoch": 0.99, "learning_rate": 6.195752155246926e-09, "loss": 1.386, "step": 36219 }, { "epoch": 0.99, "learning_rate": 6.164660031178216e-09, "loss": 1.2368, "step": 36220 }, { "epoch": 0.99, "learning_rate": 6.133646094177437e-09, "loss": 1.2368, "step": 36221 }, { "epoch": 0.99, "learning_rate": 6.1027103444877276e-09, "loss": 1.2344, "step": 36222 }, { "epoch": 0.99, "learning_rate": 6.071852782351117e-09, "loss": 1.2688, "step": 36223 }, { "epoch": 0.99, "learning_rate": 6.041073408008524e-09, "loss": 1.0911, "step": 36224 }, { "epoch": 0.99, "learning_rate": 6.010372221700867e-09, "loss": 1.2473, "step": 36225 }, { "epoch": 0.99, "learning_rate": 5.9797492236690626e-09, "loss": 1.332, "step": 36226 }, { "epoch": 0.99, "learning_rate": 5.94920441415292e-09, "loss": 1.1907, "step": 36227 }, { "epoch": 0.99, "learning_rate": 5.918737793388918e-09, "loss": 1.0232, "step": 36228 }, { "epoch": 0.99, "learning_rate": 5.8883493616179734e-09, "loss": 1.2654, "step": 36229 }, { "epoch": 0.99, "learning_rate": 5.8580391190776746e-09, "loss": 1.3247, "step": 36230 }, { "epoch": 0.99, "learning_rate": 5.827807066003388e-09, "loss": 1.2461, "step": 36231 }, { "epoch": 0.99, "learning_rate": 5.797653202633813e-09, "loss": 1.2756, "step": 36232 }, { "epoch": 0.99, "learning_rate": 5.7675775292032055e-09, "loss": 1.2756, "step": 36233 }, { "epoch": 0.99, "learning_rate": 5.737580045946933e-09, "loss": 1.1479, "step": 36234 }, { "epoch": 0.99, "learning_rate": 5.707660753101474e-09, "loss": 1.325, "step": 36235 }, { "epoch": 0.99, "learning_rate": 5.677819650898863e-09, "loss": 1.1206, "step": 36236 }, { "epoch": 0.99, "learning_rate": 5.64805673957336e-09, "loss": 1.7217, "step": 36237 }, { "epoch": 0.99, "learning_rate": 5.618372019358109e-09, "loss": 1.2932, "step": 36238 }, { "epoch": 0.99, "learning_rate": 5.588765490484038e-09, "loss": 1.2803, "step": 36239 }, { "epoch": 0.99, "learning_rate": 5.559237153185404e-09, "loss": 1.238, "step": 36240 }, { "epoch": 0.99, "learning_rate": 5.529787007689802e-09, "loss": 1.2012, "step": 36241 }, { "epoch": 0.99, "learning_rate": 5.500415054230379e-09, "loss": 1.1733, "step": 36242 }, { "epoch": 0.99, "learning_rate": 5.471121293035841e-09, "loss": 1.1365, "step": 36243 }, { "epoch": 0.99, "learning_rate": 5.441905724336005e-09, "loss": 1.1731, "step": 36244 }, { "epoch": 0.99, "learning_rate": 5.412768348358466e-09, "loss": 1.2998, "step": 36245 }, { "epoch": 0.99, "learning_rate": 5.3837091653308194e-09, "loss": 1.3245, "step": 36246 }, { "epoch": 0.99, "learning_rate": 5.354728175482882e-09, "loss": 1.5044, "step": 36247 }, { "epoch": 0.99, "learning_rate": 5.325825379038918e-09, "loss": 1.114, "step": 36248 }, { "epoch": 0.99, "learning_rate": 5.2970007762254135e-09, "loss": 1.3643, "step": 36249 }, { "epoch": 0.99, "learning_rate": 5.268254367268855e-09, "loss": 1.2327, "step": 36250 }, { "epoch": 0.99, "learning_rate": 5.2395861523935055e-09, "loss": 1.1626, "step": 36251 }, { "epoch": 0.99, "learning_rate": 5.2109961318236316e-09, "loss": 1.2388, "step": 36252 }, { "epoch": 0.99, "learning_rate": 5.182484305783497e-09, "loss": 1.3103, "step": 36253 }, { "epoch": 0.99, "learning_rate": 5.154050674495148e-09, "loss": 1.2954, "step": 36254 }, { "epoch": 0.99, "learning_rate": 5.125695238181738e-09, "loss": 1.2136, "step": 36255 }, { "epoch": 0.99, "learning_rate": 5.097417997065312e-09, "loss": 1.3936, "step": 36256 }, { "epoch": 0.99, "learning_rate": 5.069218951366805e-09, "loss": 1.2668, "step": 36257 }, { "epoch": 0.99, "learning_rate": 5.041098101306041e-09, "loss": 1.3105, "step": 36258 }, { "epoch": 0.99, "learning_rate": 5.013055447103954e-09, "loss": 1.3599, "step": 36259 }, { "epoch": 0.99, "learning_rate": 4.985090988980367e-09, "loss": 1.3162, "step": 36260 }, { "epoch": 0.99, "learning_rate": 4.957204727152887e-09, "loss": 1.3567, "step": 36261 }, { "epoch": 0.99, "learning_rate": 4.929396661841335e-09, "loss": 1.2859, "step": 36262 }, { "epoch": 0.99, "learning_rate": 4.901666793261095e-09, "loss": 1.2854, "step": 36263 }, { "epoch": 0.99, "learning_rate": 4.8740151216297715e-09, "loss": 1.1628, "step": 36264 }, { "epoch": 0.99, "learning_rate": 4.846441647164968e-09, "loss": 1.3325, "step": 36265 }, { "epoch": 0.99, "learning_rate": 4.818946370080957e-09, "loss": 1.3535, "step": 36266 }, { "epoch": 0.99, "learning_rate": 4.791529290594232e-09, "loss": 1.2959, "step": 36267 }, { "epoch": 0.99, "learning_rate": 4.764190408917957e-09, "loss": 1.2659, "step": 36268 }, { "epoch": 0.99, "learning_rate": 4.7369297252664035e-09, "loss": 1.1611, "step": 36269 }, { "epoch": 0.99, "learning_rate": 4.709747239853846e-09, "loss": 1.3218, "step": 36270 }, { "epoch": 0.99, "learning_rate": 4.682642952891225e-09, "loss": 1.1008, "step": 36271 }, { "epoch": 0.99, "learning_rate": 4.655616864591706e-09, "loss": 1.0789, "step": 36272 }, { "epoch": 0.99, "learning_rate": 4.628668975166228e-09, "loss": 1.3215, "step": 36273 }, { "epoch": 0.99, "learning_rate": 4.601799284826847e-09, "loss": 1.1099, "step": 36274 }, { "epoch": 0.99, "learning_rate": 4.575007793782282e-09, "loss": 1.3369, "step": 36275 }, { "epoch": 0.99, "learning_rate": 4.5482945022423675e-09, "loss": 1.4314, "step": 36276 }, { "epoch": 0.99, "learning_rate": 4.521659410416934e-09, "loss": 1.2468, "step": 36277 }, { "epoch": 0.99, "learning_rate": 4.4951025185135945e-09, "loss": 1.2625, "step": 36278 }, { "epoch": 0.99, "learning_rate": 4.468623826739959e-09, "loss": 1.1868, "step": 36279 }, { "epoch": 0.99, "learning_rate": 4.442223335303641e-09, "loss": 1.302, "step": 36280 }, { "epoch": 0.99, "learning_rate": 4.415901044412252e-09, "loss": 1.1377, "step": 36281 }, { "epoch": 0.99, "learning_rate": 4.3896569542689615e-09, "loss": 1.366, "step": 36282 }, { "epoch": 0.99, "learning_rate": 4.363491065082492e-09, "loss": 1.2942, "step": 36283 }, { "epoch": 0.99, "learning_rate": 4.3374033770549054e-09, "loss": 1.208, "step": 36284 }, { "epoch": 0.99, "learning_rate": 4.31139389039048e-09, "loss": 1.2292, "step": 36285 }, { "epoch": 0.99, "learning_rate": 4.2854626052946104e-09, "loss": 1.304, "step": 36286 }, { "epoch": 0.99, "learning_rate": 4.259609521968245e-09, "loss": 1.3271, "step": 36287 }, { "epoch": 0.99, "learning_rate": 4.2338346406145535e-09, "loss": 1.2993, "step": 36288 }, { "epoch": 0.99, "learning_rate": 4.208137961434489e-09, "loss": 1.386, "step": 36289 }, { "epoch": 0.99, "learning_rate": 4.18251948463011e-09, "loss": 1.2114, "step": 36290 }, { "epoch": 0.99, "learning_rate": 4.156979210401257e-09, "loss": 1.0844, "step": 36291 }, { "epoch": 0.99, "learning_rate": 4.131517138947771e-09, "loss": 1.2341, "step": 36292 }, { "epoch": 0.99, "learning_rate": 4.1061332704694925e-09, "loss": 1.2534, "step": 36293 }, { "epoch": 0.99, "learning_rate": 4.08082760516404e-09, "loss": 1.3003, "step": 36294 }, { "epoch": 0.99, "learning_rate": 4.055600143229033e-09, "loss": 1.2539, "step": 36295 }, { "epoch": 0.99, "learning_rate": 4.030450884863202e-09, "loss": 1.1694, "step": 36296 }, { "epoch": 0.99, "learning_rate": 4.005379830263057e-09, "loss": 1.2747, "step": 36297 }, { "epoch": 0.99, "learning_rate": 3.9803869796239955e-09, "loss": 1.0933, "step": 36298 }, { "epoch": 0.99, "learning_rate": 3.9554723331425295e-09, "loss": 1.2795, "step": 36299 }, { "epoch": 0.99, "learning_rate": 3.930635891011836e-09, "loss": 1.2993, "step": 36300 }, { "epoch": 0.99, "learning_rate": 3.905877653428425e-09, "loss": 1.4448, "step": 36301 }, { "epoch": 0.99, "learning_rate": 3.881197620584365e-09, "loss": 1.2983, "step": 36302 }, { "epoch": 0.99, "learning_rate": 3.8565957926728346e-09, "loss": 1.2512, "step": 36303 }, { "epoch": 0.99, "learning_rate": 3.832072169888123e-09, "loss": 1.2461, "step": 36304 }, { "epoch": 0.99, "learning_rate": 3.807626752420079e-09, "loss": 1.0469, "step": 36305 }, { "epoch": 0.99, "learning_rate": 3.783259540459661e-09, "loss": 1.417, "step": 36306 }, { "epoch": 0.99, "learning_rate": 3.758970534200046e-09, "loss": 1.3704, "step": 36307 }, { "epoch": 0.99, "learning_rate": 3.734759733828863e-09, "loss": 1.2327, "step": 36308 }, { "epoch": 0.99, "learning_rate": 3.7106271395359605e-09, "loss": 1.4502, "step": 36309 }, { "epoch": 0.99, "learning_rate": 3.686572751511186e-09, "loss": 1.3467, "step": 36310 }, { "epoch": 0.99, "learning_rate": 3.6625965699421672e-09, "loss": 1.2018, "step": 36311 }, { "epoch": 0.99, "learning_rate": 3.638698595015422e-09, "loss": 1.1411, "step": 36312 }, { "epoch": 0.99, "learning_rate": 3.6148788269196875e-09, "loss": 1.1973, "step": 36313 }, { "epoch": 0.99, "learning_rate": 3.591137265840372e-09, "loss": 1.3647, "step": 36314 }, { "epoch": 0.99, "learning_rate": 3.5674739119639924e-09, "loss": 1.1228, "step": 36315 }, { "epoch": 0.99, "learning_rate": 3.5438887654737355e-09, "loss": 1.1499, "step": 36316 }, { "epoch": 0.99, "learning_rate": 3.5203818265572287e-09, "loss": 1.1394, "step": 36317 }, { "epoch": 0.99, "learning_rate": 3.496953095395439e-09, "loss": 1.1372, "step": 36318 }, { "epoch": 0.99, "learning_rate": 3.473602572172663e-09, "loss": 1.2549, "step": 36319 }, { "epoch": 0.99, "learning_rate": 3.4503302570709774e-09, "loss": 1.2756, "step": 36320 }, { "epoch": 0.99, "learning_rate": 3.4271361502746792e-09, "loss": 1.2825, "step": 36321 }, { "epoch": 0.99, "learning_rate": 3.4040202519636247e-09, "loss": 1.3315, "step": 36322 }, { "epoch": 0.99, "learning_rate": 3.3809825623176694e-09, "loss": 1.3271, "step": 36323 }, { "epoch": 0.99, "learning_rate": 3.358023081518891e-09, "loss": 1.3049, "step": 36324 }, { "epoch": 0.99, "learning_rate": 3.335141809746034e-09, "loss": 1.2847, "step": 36325 }, { "epoch": 0.99, "learning_rate": 3.3123387471789557e-09, "loss": 1.4275, "step": 36326 }, { "epoch": 0.99, "learning_rate": 3.2896138939941813e-09, "loss": 1.2253, "step": 36327 }, { "epoch": 0.99, "learning_rate": 3.2669672503715665e-09, "loss": 1.3147, "step": 36328 }, { "epoch": 0.99, "learning_rate": 3.244398816487637e-09, "loss": 1.2607, "step": 36329 }, { "epoch": 0.99, "learning_rate": 3.2219085925178086e-09, "loss": 1.1133, "step": 36330 }, { "epoch": 0.99, "learning_rate": 3.199496578639716e-09, "loss": 1.4429, "step": 36331 }, { "epoch": 0.99, "learning_rate": 3.1771627750276645e-09, "loss": 1.2593, "step": 36332 }, { "epoch": 0.99, "learning_rate": 3.1549071818559597e-09, "loss": 1.3608, "step": 36333 }, { "epoch": 0.99, "learning_rate": 3.132729799300016e-09, "loss": 1.2922, "step": 36334 }, { "epoch": 0.99, "learning_rate": 3.110630627533029e-09, "loss": 1.0364, "step": 36335 }, { "epoch": 0.99, "learning_rate": 3.0886096667270826e-09, "loss": 1.1113, "step": 36336 }, { "epoch": 0.99, "learning_rate": 3.066666917055372e-09, "loss": 1.3313, "step": 36337 }, { "epoch": 0.99, "learning_rate": 3.0448023786888715e-09, "loss": 1.2617, "step": 36338 }, { "epoch": 0.99, "learning_rate": 3.0230160517996656e-09, "loss": 1.4343, "step": 36339 }, { "epoch": 0.99, "learning_rate": 3.0013079365565077e-09, "loss": 1.0608, "step": 36340 }, { "epoch": 0.99, "learning_rate": 2.979678033130373e-09, "loss": 1.3445, "step": 36341 }, { "epoch": 0.99, "learning_rate": 2.9581263416900154e-09, "loss": 1.7573, "step": 36342 }, { "epoch": 0.99, "learning_rate": 2.9366528624052982e-09, "loss": 1.2207, "step": 36343 }, { "epoch": 0.99, "learning_rate": 2.9152575954427553e-09, "loss": 1.2803, "step": 36344 }, { "epoch": 0.99, "learning_rate": 2.8939405409700305e-09, "loss": 1.3218, "step": 36345 }, { "epoch": 0.99, "learning_rate": 2.8727016991547673e-09, "loss": 1.1643, "step": 36346 }, { "epoch": 0.99, "learning_rate": 2.851541070162389e-09, "loss": 0.9053, "step": 36347 }, { "epoch": 0.99, "learning_rate": 2.830458654158319e-09, "loss": 1.2922, "step": 36348 }, { "epoch": 0.99, "learning_rate": 2.8094544513079804e-09, "loss": 1.3174, "step": 36349 }, { "epoch": 0.99, "learning_rate": 2.7885284617745756e-09, "loss": 1.2117, "step": 36350 }, { "epoch": 0.99, "learning_rate": 2.7676806857235284e-09, "loss": 1.2874, "step": 36351 }, { "epoch": 0.99, "learning_rate": 2.746911123316931e-09, "loss": 1.1858, "step": 36352 }, { "epoch": 0.99, "learning_rate": 2.7262197747179865e-09, "loss": 1.1636, "step": 36353 }, { "epoch": 0.99, "learning_rate": 2.7056066400876766e-09, "loss": 1.3513, "step": 36354 }, { "epoch": 0.99, "learning_rate": 2.6850717195869845e-09, "loss": 1.2891, "step": 36355 }, { "epoch": 0.99, "learning_rate": 2.6646150133780023e-09, "loss": 1.3003, "step": 36356 }, { "epoch": 0.99, "learning_rate": 2.644236521619492e-09, "loss": 1.3989, "step": 36357 }, { "epoch": 0.99, "learning_rate": 2.6239362444713258e-09, "loss": 1.3203, "step": 36358 }, { "epoch": 0.99, "learning_rate": 2.6037141820933752e-09, "loss": 1.2935, "step": 36359 }, { "epoch": 0.99, "learning_rate": 2.5835703346421827e-09, "loss": 1.7222, "step": 36360 }, { "epoch": 0.99, "learning_rate": 2.563504702275399e-09, "loss": 1.2288, "step": 36361 }, { "epoch": 0.99, "learning_rate": 2.5435172851517865e-09, "loss": 1.2969, "step": 36362 }, { "epoch": 0.99, "learning_rate": 2.523608083425666e-09, "loss": 1.2991, "step": 36363 }, { "epoch": 0.99, "learning_rate": 2.5037770972546894e-09, "loss": 1.4075, "step": 36364 }, { "epoch": 0.99, "learning_rate": 2.4840243267920674e-09, "loss": 1.3901, "step": 36365 }, { "epoch": 0.99, "learning_rate": 2.4643497721932306e-09, "loss": 1.2107, "step": 36366 }, { "epoch": 0.99, "learning_rate": 2.4447534336125013e-09, "loss": 1.2229, "step": 36367 }, { "epoch": 0.99, "learning_rate": 2.425235311203089e-09, "loss": 1.2009, "step": 36368 }, { "epoch": 0.99, "learning_rate": 2.405795405117095e-09, "loss": 1.2073, "step": 36369 }, { "epoch": 0.99, "learning_rate": 2.3864337155077298e-09, "loss": 1.3308, "step": 36370 }, { "epoch": 0.99, "learning_rate": 2.367150242524874e-09, "loss": 1.2759, "step": 36371 }, { "epoch": 0.99, "learning_rate": 2.347944986320627e-09, "loss": 1.2209, "step": 36372 }, { "epoch": 0.99, "learning_rate": 2.32881794704376e-09, "loss": 0.9939, "step": 36373 }, { "epoch": 0.99, "learning_rate": 2.309769124846373e-09, "loss": 1.3904, "step": 36374 }, { "epoch": 0.99, "learning_rate": 2.290798519875015e-09, "loss": 1.1587, "step": 36375 }, { "epoch": 0.99, "learning_rate": 2.2719061322795665e-09, "loss": 1.2878, "step": 36376 }, { "epoch": 0.99, "learning_rate": 2.2530919622076873e-09, "loss": 1.0579, "step": 36377 }, { "epoch": 0.99, "learning_rate": 2.2343560098070373e-09, "loss": 1.269, "step": 36378 }, { "epoch": 0.99, "learning_rate": 2.2156982752219445e-09, "loss": 1.188, "step": 36379 }, { "epoch": 0.99, "learning_rate": 2.19711875860118e-09, "loss": 1.4199, "step": 36380 }, { "epoch": 0.99, "learning_rate": 2.178617460087962e-09, "loss": 1.1978, "step": 36381 }, { "epoch": 0.99, "learning_rate": 2.160194379828839e-09, "loss": 1.137, "step": 36382 }, { "epoch": 0.99, "learning_rate": 2.141849517967032e-09, "loss": 1.3723, "step": 36383 }, { "epoch": 0.99, "learning_rate": 2.1235828746457577e-09, "loss": 1.387, "step": 36384 }, { "epoch": 0.99, "learning_rate": 2.1053944500071254e-09, "loss": 1.3394, "step": 36385 }, { "epoch": 0.99, "learning_rate": 2.0872842441965744e-09, "loss": 1.0503, "step": 36386 }, { "epoch": 0.99, "learning_rate": 2.0692522573517728e-09, "loss": 1.2671, "step": 36387 }, { "epoch": 0.99, "learning_rate": 2.0512984896170483e-09, "loss": 1.397, "step": 36388 }, { "epoch": 0.99, "learning_rate": 2.0334229411311803e-09, "loss": 1.2976, "step": 36389 }, { "epoch": 0.99, "learning_rate": 2.015625612035166e-09, "loss": 1.1396, "step": 36390 }, { "epoch": 0.99, "learning_rate": 1.997906502466673e-09, "loss": 1.1768, "step": 36391 }, { "epoch": 0.99, "learning_rate": 1.9802656125655907e-09, "loss": 1.1741, "step": 36392 }, { "epoch": 0.99, "learning_rate": 1.962702942468475e-09, "loss": 1.2822, "step": 36393 }, { "epoch": 0.99, "learning_rate": 1.945218492315215e-09, "loss": 1.2678, "step": 36394 }, { "epoch": 0.99, "learning_rate": 1.9278122622401473e-09, "loss": 1.2539, "step": 36395 }, { "epoch": 0.99, "learning_rate": 1.9104842523809396e-09, "loss": 1.2725, "step": 36396 }, { "epoch": 0.99, "learning_rate": 1.893234462873039e-09, "loss": 1.3938, "step": 36397 }, { "epoch": 0.99, "learning_rate": 1.876062893850783e-09, "loss": 1.3687, "step": 36398 }, { "epoch": 0.99, "learning_rate": 1.8589695454473978e-09, "loss": 1.087, "step": 36399 }, { "epoch": 0.99, "learning_rate": 1.8419544177994407e-09, "loss": 1.231, "step": 36400 }, { "epoch": 0.99, "learning_rate": 1.8250175110390288e-09, "loss": 1.167, "step": 36401 }, { "epoch": 0.99, "learning_rate": 1.8081588252971683e-09, "loss": 1.2935, "step": 36402 }, { "epoch": 0.99, "learning_rate": 1.7913783607070856e-09, "loss": 1.1072, "step": 36403 }, { "epoch": 0.99, "learning_rate": 1.7746761173997873e-09, "loss": 1.2312, "step": 36404 }, { "epoch": 0.99, "learning_rate": 1.7580520955051694e-09, "loss": 1.1443, "step": 36405 }, { "epoch": 0.99, "learning_rate": 1.7415062951553485e-09, "loss": 1.2661, "step": 36406 }, { "epoch": 0.99, "learning_rate": 1.7250387164780002e-09, "loss": 1.218, "step": 36407 }, { "epoch": 0.99, "learning_rate": 1.7086493596019106e-09, "loss": 1.3667, "step": 36408 }, { "epoch": 0.99, "learning_rate": 1.692338224655865e-09, "loss": 1.2839, "step": 36409 }, { "epoch": 0.99, "learning_rate": 1.6761053117686498e-09, "loss": 1.3252, "step": 36410 }, { "epoch": 0.99, "learning_rate": 1.6599506210646099e-09, "loss": 1.3149, "step": 36411 }, { "epoch": 0.99, "learning_rate": 1.6438741526725311e-09, "loss": 1.4133, "step": 36412 }, { "epoch": 0.99, "learning_rate": 1.6278759067167582e-09, "loss": 1.3467, "step": 36413 }, { "epoch": 0.99, "learning_rate": 1.6119558833227466e-09, "loss": 1.3762, "step": 36414 }, { "epoch": 0.99, "learning_rate": 1.5961140826159516e-09, "loss": 1.2324, "step": 36415 }, { "epoch": 0.99, "learning_rate": 1.5803505047184975e-09, "loss": 1.6592, "step": 36416 }, { "epoch": 0.99, "learning_rate": 1.5646651497558397e-09, "loss": 1.1072, "step": 36417 }, { "epoch": 0.99, "learning_rate": 1.5490580178489922e-09, "loss": 1.1208, "step": 36418 }, { "epoch": 0.99, "learning_rate": 1.5335291091211902e-09, "loss": 1.1746, "step": 36419 }, { "epoch": 0.99, "learning_rate": 1.5180784236923374e-09, "loss": 1.1375, "step": 36420 }, { "epoch": 0.99, "learning_rate": 1.5027059616856686e-09, "loss": 1.1675, "step": 36421 }, { "epoch": 0.99, "learning_rate": 1.4874117232199781e-09, "loss": 1.1885, "step": 36422 }, { "epoch": 0.99, "learning_rate": 1.4721957084151694e-09, "loss": 1.2183, "step": 36423 }, { "epoch": 0.99, "learning_rate": 1.4570579173900367e-09, "loss": 1.0977, "step": 36424 }, { "epoch": 0.99, "learning_rate": 1.441998350263374e-09, "loss": 1.345, "step": 36425 }, { "epoch": 0.99, "learning_rate": 1.4270170071517541e-09, "loss": 1.2754, "step": 36426 }, { "epoch": 0.99, "learning_rate": 1.4121138881750817e-09, "loss": 1.3599, "step": 36427 }, { "epoch": 0.99, "learning_rate": 1.3972889934477096e-09, "loss": 1.3186, "step": 36428 }, { "epoch": 0.99, "learning_rate": 1.3825423230862111e-09, "loss": 1.2168, "step": 36429 }, { "epoch": 0.99, "learning_rate": 1.3678738772060495e-09, "loss": 1.27, "step": 36430 }, { "epoch": 0.99, "learning_rate": 1.353283655922688e-09, "loss": 1.2803, "step": 36431 }, { "epoch": 0.99, "learning_rate": 1.338771659348259e-09, "loss": 1.0564, "step": 36432 }, { "epoch": 0.99, "learning_rate": 1.324337887598226e-09, "loss": 1.7876, "step": 36433 }, { "epoch": 0.99, "learning_rate": 1.3099823407847212e-09, "loss": 1.3132, "step": 36434 }, { "epoch": 1.0, "learning_rate": 1.2957050190209875e-09, "loss": 1.3018, "step": 36435 }, { "epoch": 1.0, "learning_rate": 1.2815059224169368e-09, "loss": 1.366, "step": 36436 }, { "epoch": 1.0, "learning_rate": 1.267385051084702e-09, "loss": 1.3706, "step": 36437 }, { "epoch": 1.0, "learning_rate": 1.2533424051353048e-09, "loss": 1.4915, "step": 36438 }, { "epoch": 1.0, "learning_rate": 1.2393779846775478e-09, "loss": 1.0366, "step": 36439 }, { "epoch": 1.0, "learning_rate": 1.2254917898213426e-09, "loss": 1.1343, "step": 36440 }, { "epoch": 1.0, "learning_rate": 1.2116838206754912e-09, "loss": 1.2012, "step": 36441 }, { "epoch": 1.0, "learning_rate": 1.1979540773465747e-09, "loss": 1.2776, "step": 36442 }, { "epoch": 1.0, "learning_rate": 1.1843025599445057e-09, "loss": 1.1724, "step": 36443 }, { "epoch": 1.0, "learning_rate": 1.170729268573645e-09, "loss": 1.2598, "step": 36444 }, { "epoch": 1.0, "learning_rate": 1.157234203341684e-09, "loss": 1.1917, "step": 36445 }, { "epoch": 1.0, "learning_rate": 1.143817364354094e-09, "loss": 1.2827, "step": 36446 }, { "epoch": 1.0, "learning_rate": 1.1304787517141259e-09, "loss": 1.3167, "step": 36447 }, { "epoch": 1.0, "learning_rate": 1.1172183655283608e-09, "loss": 1.3193, "step": 36448 }, { "epoch": 1.0, "learning_rate": 1.1040362059000498e-09, "loss": 1.3215, "step": 36449 }, { "epoch": 1.0, "learning_rate": 1.0909322729313331e-09, "loss": 1.2729, "step": 36450 }, { "epoch": 1.0, "learning_rate": 1.0779065667254617e-09, "loss": 1.2664, "step": 36451 }, { "epoch": 1.0, "learning_rate": 1.0649590873845762e-09, "loss": 1.137, "step": 36452 }, { "epoch": 1.0, "learning_rate": 1.0520898350097064e-09, "loss": 1.3623, "step": 36453 }, { "epoch": 1.0, "learning_rate": 1.0392988097007728e-09, "loss": 1.2544, "step": 36454 }, { "epoch": 1.0, "learning_rate": 1.0265860115588056e-09, "loss": 1.2954, "step": 36455 }, { "epoch": 1.0, "learning_rate": 1.0139514406837247e-09, "loss": 1.2517, "step": 36456 }, { "epoch": 1.0, "learning_rate": 1.00139509717323e-09, "loss": 1.3118, "step": 36457 }, { "epoch": 1.0, "learning_rate": 9.88916981125021e-10, "loss": 1.2356, "step": 36458 }, { "epoch": 1.0, "learning_rate": 9.765170926390177e-10, "loss": 1.302, "step": 36459 }, { "epoch": 1.0, "learning_rate": 9.641954318095893e-10, "loss": 1.095, "step": 36460 }, { "epoch": 1.0, "learning_rate": 9.519519987355453e-10, "loss": 1.3882, "step": 36461 }, { "epoch": 1.0, "learning_rate": 9.397867935112548e-10, "loss": 1.4497, "step": 36462 }, { "epoch": 1.0, "learning_rate": 9.276998162310868e-10, "loss": 1.3247, "step": 36463 }, { "epoch": 1.0, "learning_rate": 9.156910669916308e-10, "loss": 1.4175, "step": 36464 }, { "epoch": 1.0, "learning_rate": 9.037605458861454e-10, "loss": 1.3767, "step": 36465 }, { "epoch": 1.0, "learning_rate": 8.919082530078893e-10, "loss": 1.1758, "step": 36466 }, { "epoch": 1.0, "learning_rate": 8.801341884490111e-10, "loss": 1.176, "step": 36467 }, { "epoch": 1.0, "learning_rate": 8.684383523016593e-10, "loss": 1.1616, "step": 36468 }, { "epoch": 1.0, "learning_rate": 8.568207446579824e-10, "loss": 1.3787, "step": 36469 }, { "epoch": 1.0, "learning_rate": 8.452813656090186e-10, "loss": 1.3623, "step": 36470 }, { "epoch": 1.0, "learning_rate": 8.338202152446961e-10, "loss": 1.3037, "step": 36471 }, { "epoch": 1.0, "learning_rate": 8.224372936538328e-10, "loss": 1.1826, "step": 36472 }, { "epoch": 1.0, "learning_rate": 8.111326009263564e-10, "loss": 1.0973, "step": 36473 }, { "epoch": 1.0, "learning_rate": 7.999061371510852e-10, "loss": 1.207, "step": 36474 }, { "epoch": 1.0, "learning_rate": 7.887579024157266e-10, "loss": 1.1548, "step": 36475 }, { "epoch": 1.0, "learning_rate": 7.77687896806878e-10, "loss": 1.2434, "step": 36476 }, { "epoch": 1.0, "learning_rate": 7.666961204111367e-10, "loss": 1.2712, "step": 36477 }, { "epoch": 1.0, "learning_rate": 7.557825733151003e-10, "loss": 1.3613, "step": 36478 }, { "epoch": 1.0, "learning_rate": 7.449472556031456e-10, "loss": 1.3154, "step": 36479 }, { "epoch": 1.0, "learning_rate": 7.341901673618701e-10, "loss": 1.3008, "step": 36480 }, { "epoch": 1.0, "learning_rate": 7.235113086734302e-10, "loss": 1.1453, "step": 36481 }, { "epoch": 1.0, "learning_rate": 7.129106796222029e-10, "loss": 1.3511, "step": 36482 }, { "epoch": 1.0, "learning_rate": 7.02388280291455e-10, "loss": 1.1975, "step": 36483 }, { "epoch": 1.0, "learning_rate": 6.919441107633428e-10, "loss": 1.2458, "step": 36484 }, { "epoch": 1.0, "learning_rate": 6.815781711200231e-10, "loss": 1.3232, "step": 36485 }, { "epoch": 1.0, "learning_rate": 6.712904614414317e-10, "loss": 1.3503, "step": 36486 }, { "epoch": 1.0, "learning_rate": 6.61080981808615e-10, "loss": 1.314, "step": 36487 }, { "epoch": 1.0, "learning_rate": 6.50949732301509e-10, "loss": 1.2888, "step": 36488 }, { "epoch": 1.0, "learning_rate": 6.408967129989396e-10, "loss": 1.3599, "step": 36489 }, { "epoch": 1.0, "learning_rate": 6.309219239797326e-10, "loss": 1.1238, "step": 36490 }, { "epoch": 1.0, "learning_rate": 6.210253653227139e-10, "loss": 1.1537, "step": 36491 }, { "epoch": 1.0, "learning_rate": 6.112070371055989e-10, "loss": 1.094, "step": 36492 }, { "epoch": 1.0, "learning_rate": 6.014669394027728e-10, "loss": 1.2402, "step": 36493 }, { "epoch": 1.0, "learning_rate": 5.918050722930613e-10, "loss": 1.2009, "step": 36494 }, { "epoch": 1.0, "learning_rate": 5.822214358508493e-10, "loss": 1.2797, "step": 36495 }, { "epoch": 1.0, "learning_rate": 5.727160301516321e-10, "loss": 1.1826, "step": 36496 }, { "epoch": 1.0, "learning_rate": 5.632888552686844e-10, "loss": 1.167, "step": 36497 }, { "epoch": 1.0, "learning_rate": 5.53939911276391e-10, "loss": 1.4243, "step": 36498 }, { "epoch": 1.0, "learning_rate": 5.44669198249137e-10, "loss": 1.219, "step": 36499 }, { "epoch": 1.0, "learning_rate": 5.354767162568663e-10, "loss": 1.147, "step": 36500 }, { "epoch": 1.0, "learning_rate": 5.263624653739641e-10, "loss": 1.3525, "step": 36501 }, { "epoch": 1.0, "learning_rate": 5.173264456703742e-10, "loss": 1.2966, "step": 36502 }, { "epoch": 1.0, "learning_rate": 5.083686572171509e-10, "loss": 1.2737, "step": 36503 }, { "epoch": 1.0, "learning_rate": 4.994891000842383e-10, "loss": 1.2351, "step": 36504 }, { "epoch": 1.0, "learning_rate": 4.906877743415806e-10, "loss": 1.1553, "step": 36505 }, { "epoch": 1.0, "learning_rate": 4.819646800580113e-10, "loss": 1.2219, "step": 36506 }, { "epoch": 1.0, "learning_rate": 4.733198173001441e-10, "loss": 1.291, "step": 36507 }, { "epoch": 1.0, "learning_rate": 4.6475318613792284e-10, "loss": 1.2683, "step": 36508 }, { "epoch": 1.0, "learning_rate": 4.56264786637961e-10, "loss": 1.3735, "step": 36509 }, { "epoch": 1.0, "learning_rate": 4.4785461886465156e-10, "loss": 1.2798, "step": 36510 }, { "epoch": 1.0, "learning_rate": 4.39522682885718e-10, "loss": 1.0898, "step": 36511 }, { "epoch": 1.0, "learning_rate": 4.312689787655533e-10, "loss": 1.1121, "step": 36512 }, { "epoch": 1.0, "learning_rate": 4.2309350656966065e-10, "loss": 1.2603, "step": 36513 }, { "epoch": 1.0, "learning_rate": 4.1499626636132275e-10, "loss": 1.1611, "step": 36514 }, { "epoch": 1.0, "learning_rate": 4.069772582038223e-10, "loss": 1.217, "step": 36515 }, { "epoch": 1.0, "learning_rate": 3.9903648215933176e-10, "loss": 1.1523, "step": 36516 }, { "epoch": 1.0, "learning_rate": 3.911739382911339e-10, "loss": 1.2981, "step": 36517 }, { "epoch": 1.0, "learning_rate": 3.83389626660291e-10, "loss": 1.322, "step": 36518 }, { "epoch": 1.0, "learning_rate": 3.756835473278653e-10, "loss": 1.2927, "step": 36519 }, { "epoch": 1.0, "learning_rate": 3.6805570035380877e-10, "loss": 1.1299, "step": 36520 }, { "epoch": 1.0, "learning_rate": 3.6050608579807354e-10, "loss": 1.3071, "step": 36521 }, { "epoch": 1.0, "learning_rate": 3.530347037183912e-10, "loss": 1.3242, "step": 36522 }, { "epoch": 1.0, "learning_rate": 3.45641554175824e-10, "loss": 1.3101, "step": 36523 }, { "epoch": 1.0, "learning_rate": 3.383266372258831e-10, "loss": 1.3381, "step": 36524 }, { "epoch": 1.0, "learning_rate": 3.310899529274103e-10, "loss": 1.1597, "step": 36525 }, { "epoch": 1.0, "learning_rate": 3.239315013359168e-10, "loss": 1.2531, "step": 36526 }, { "epoch": 1.0, "learning_rate": 3.168512825080239e-10, "loss": 1.2115, "step": 36527 }, { "epoch": 1.0, "learning_rate": 3.0984929649924277e-10, "loss": 1.2502, "step": 36528 }, { "epoch": 1.0, "learning_rate": 3.0292554336286415e-10, "loss": 1.28, "step": 36529 }, { "epoch": 1.0, "learning_rate": 2.9608002315550943e-10, "loss": 1.23, "step": 36530 }, { "epoch": 1.0, "learning_rate": 2.8931273592824884e-10, "loss": 1.2627, "step": 36531 }, { "epoch": 1.0, "learning_rate": 2.8262368173548325e-10, "loss": 1.1267, "step": 36532 }, { "epoch": 1.0, "learning_rate": 2.7601286063050346e-10, "loss": 1.1418, "step": 36533 }, { "epoch": 1.0, "learning_rate": 2.6948027266215925e-10, "loss": 1.1135, "step": 36534 }, { "epoch": 1.0, "learning_rate": 2.630259178837413e-10, "loss": 1.5928, "step": 36535 }, { "epoch": 1.0, "learning_rate": 2.566497963452097e-10, "loss": 1.2573, "step": 36536 }, { "epoch": 1.0, "learning_rate": 2.5035190809763467e-10, "loss": 1.3647, "step": 36537 }, { "epoch": 1.0, "learning_rate": 2.4413225318764555e-10, "loss": 1.1982, "step": 36538 }, { "epoch": 1.0, "learning_rate": 2.379908316652024e-10, "loss": 1.3511, "step": 36539 }, { "epoch": 1.0, "learning_rate": 2.319276435791551e-10, "loss": 1.4004, "step": 36540 }, { "epoch": 1.0, "learning_rate": 2.259426889761329e-10, "loss": 1.3091, "step": 36541 }, { "epoch": 1.0, "learning_rate": 2.2003596790387548e-10, "loss": 1.1421, "step": 36542 }, { "epoch": 1.0, "learning_rate": 2.1420748040679173e-10, "loss": 1.2101, "step": 36543 }, { "epoch": 1.0, "learning_rate": 2.0845722653151101e-10, "loss": 1.3887, "step": 36544 }, { "epoch": 1.0, "learning_rate": 2.0278520632355246e-10, "loss": 1.4119, "step": 36545 }, { "epoch": 1.0, "learning_rate": 1.9719141982621482e-10, "loss": 1.0167, "step": 36546 }, { "epoch": 1.0, "learning_rate": 1.9167586708501719e-10, "loss": 1.2769, "step": 36547 }, { "epoch": 1.0, "learning_rate": 1.8623854814103782e-10, "loss": 1.2695, "step": 36548 }, { "epoch": 1.0, "learning_rate": 1.808794630375754e-10, "loss": 1.2351, "step": 36549 }, { "epoch": 1.0, "learning_rate": 1.7559861181681847e-10, "loss": 1.3577, "step": 36550 }, { "epoch": 1.0, "learning_rate": 1.7039599451984523e-10, "loss": 1.3118, "step": 36551 }, { "epoch": 1.0, "learning_rate": 1.6527161118773393e-10, "loss": 1.4392, "step": 36552 }, { "epoch": 1.0, "learning_rate": 1.602254618593424e-10, "loss": 1.2632, "step": 36553 }, { "epoch": 1.0, "learning_rate": 1.5525754657574886e-10, "loss": 1.2021, "step": 36554 }, { "epoch": 1.0, "learning_rate": 1.5036786537581115e-10, "loss": 1.2983, "step": 36555 }, { "epoch": 1.0, "learning_rate": 1.4555641829616662e-10, "loss": 1.1428, "step": 36556 }, { "epoch": 1.0, "learning_rate": 1.4082320537567306e-10, "loss": 1.1377, "step": 36557 }, { "epoch": 1.0, "learning_rate": 1.3616822665096786e-10, "loss": 1.4275, "step": 36558 }, { "epoch": 1.0, "learning_rate": 1.3159148215979855e-10, "loss": 1.2483, "step": 36559 }, { "epoch": 1.0, "learning_rate": 1.2709297193547188e-10, "loss": 1.4014, "step": 36560 }, { "epoch": 1.0, "learning_rate": 1.2267269601462518e-10, "loss": 1.3401, "step": 36561 }, { "epoch": 1.0, "learning_rate": 1.1833065443278557e-10, "loss": 1.2617, "step": 36562 }, { "epoch": 1.0, "learning_rate": 1.1406684722214956e-10, "loss": 1.2539, "step": 36563 }, { "epoch": 1.0, "learning_rate": 1.098812744160238e-10, "loss": 1.2966, "step": 36564 }, { "epoch": 1.0, "learning_rate": 1.0577393604882524e-10, "loss": 1.3201, "step": 36565 }, { "epoch": 1.0, "learning_rate": 1.0174483215164011e-10, "loss": 1.1035, "step": 36566 }, { "epoch": 1.0, "learning_rate": 9.779396275555463e-11, "loss": 1.2068, "step": 36567 }, { "epoch": 1.0, "learning_rate": 9.392132789276531e-11, "loss": 1.272, "step": 36568 }, { "epoch": 1.0, "learning_rate": 9.012692759213792e-11, "loss": 1.6357, "step": 36569 }, { "epoch": 1.0, "learning_rate": 8.641076188475872e-11, "loss": 1.3926, "step": 36570 }, { "epoch": 1.0, "learning_rate": 8.277283079838327e-11, "loss": 1.2578, "step": 36571 }, { "epoch": 1.0, "learning_rate": 7.921313436298761e-11, "loss": 1.3965, "step": 36572 }, { "epoch": 1.0, "learning_rate": 7.573167260521708e-11, "loss": 1.2556, "step": 36573 }, { "epoch": 1.0, "learning_rate": 7.232844555282725e-11, "loss": 1.2705, "step": 36574 }, { "epoch": 1.0, "learning_rate": 6.900345323135327e-11, "loss": 1.2058, "step": 36575 }, { "epoch": 1.0, "learning_rate": 6.57566956685507e-11, "loss": 1.3169, "step": 36576 }, { "epoch": 1.0, "learning_rate": 6.258817288773422e-11, "loss": 1.2, "step": 36577 }, { "epoch": 1.0, "learning_rate": 5.949788491665942e-11, "loss": 1.2285, "step": 36578 }, { "epoch": 1.0, "learning_rate": 5.648583177642053e-11, "loss": 1.2935, "step": 36579 }, { "epoch": 1.0, "learning_rate": 5.355201349255268e-11, "loss": 1.666, "step": 36580 }, { "epoch": 1.0, "learning_rate": 5.069643008726033e-11, "loss": 1.1467, "step": 36581 }, { "epoch": 1.0, "learning_rate": 4.791908158274794e-11, "loss": 1.2483, "step": 36582 }, { "epoch": 1.0, "learning_rate": 4.521996800121997e-11, "loss": 1.1934, "step": 36583 }, { "epoch": 1.0, "learning_rate": 4.2599089363770663e-11, "loss": 1.3149, "step": 36584 }, { "epoch": 1.0, "learning_rate": 4.005644569038403e-11, "loss": 1.135, "step": 36585 }, { "epoch": 1.0, "learning_rate": 3.7592037002154304e-11, "loss": 1.2461, "step": 36586 }, { "epoch": 1.0, "learning_rate": 3.5205863316845055e-11, "loss": 1.2585, "step": 36587 }, { "epoch": 1.0, "learning_rate": 3.289792465333008e-11, "loss": 1.2236, "step": 36588 }, { "epoch": 1.0, "learning_rate": 3.066822103048317e-11, "loss": 1.3218, "step": 36589 }, { "epoch": 1.0, "learning_rate": 2.8516752466067886e-11, "loss": 1.2888, "step": 36590 }, { "epoch": 1.0, "learning_rate": 2.644351897562736e-11, "loss": 1.3545, "step": 36591 }, { "epoch": 1.0, "learning_rate": 2.4448520575814928e-11, "loss": 1.6929, "step": 36592 }, { "epoch": 1.0, "learning_rate": 2.2531757282173717e-11, "loss": 1.2512, "step": 36593 }, { "epoch": 1.0, "learning_rate": 2.069322911024685e-11, "loss": 1.0764, "step": 36594 }, { "epoch": 1.0, "learning_rate": 1.8932936074467223e-11, "loss": 1.2615, "step": 36595 }, { "epoch": 1.0, "learning_rate": 1.7250878187047293e-11, "loss": 1.2166, "step": 36596 }, { "epoch": 1.0, "learning_rate": 1.564705546353018e-11, "loss": 1.2815, "step": 36597 }, { "epoch": 1.0, "learning_rate": 1.4121467915018116e-11, "loss": 1.1255, "step": 36598 }, { "epoch": 1.0, "learning_rate": 1.2674115553723554e-11, "loss": 1.199, "step": 36599 }, { "epoch": 1.0, "learning_rate": 1.1304998390748722e-11, "loss": 1.2104, "step": 36600 }, { "epoch": 1.0, "learning_rate": 1.0014116437195853e-11, "loss": 1.3345, "step": 36601 }, { "epoch": 1.0, "learning_rate": 8.80146970194673e-12, "loss": 1.2747, "step": 36602 }, { "epoch": 1.0, "learning_rate": 7.667058197213806e-12, "loss": 1.1398, "step": 36603 }, { "epoch": 1.0, "learning_rate": 6.6108819285481966e-12, "loss": 1.2744, "step": 36604 }, { "epoch": 1.0, "learning_rate": 5.632940907052131e-12, "loss": 1.0815, "step": 36605 }, { "epoch": 1.0, "learning_rate": 4.733235138276726e-12, "loss": 1.3191, "step": 36606 }, { "epoch": 1.0, "learning_rate": 3.911764631103765e-12, "loss": 1.1958, "step": 36607 }, { "epoch": 1.0, "learning_rate": 3.1685293899741397e-12, "loss": 1.092, "step": 36608 }, { "epoch": 1.0, "learning_rate": 2.503529422659412e-12, "loss": 1.2971, "step": 36609 }, { "epoch": 1.0, "learning_rate": 1.9167647324902504e-12, "loss": 1.3027, "step": 36610 }, { "epoch": 1.0, "learning_rate": 1.4082353261279934e-12, "loss": 1.4199, "step": 36611 }, { "epoch": 1.0, "learning_rate": 9.77941205793087e-13, "loss": 1.2273, "step": 36612 }, { "epoch": 1.0, "learning_rate": 6.258823748162002e-13, "loss": 1.2344, "step": 36613 }, { "epoch": 1.0, "learning_rate": 3.52058837638225e-13, "loss": 1.2212, "step": 36614 }, { "epoch": 1.0, "learning_rate": 1.5647059536938457e-13, "loss": 1.3315, "step": 36615 }, { "epoch": 1.0, "learning_rate": 3.91176491199019e-14, "loss": 1.2566, "step": 36616 }, { "epoch": 1.0, "learning_rate": 0.0, "loss": 1.2429, "step": 36617 }, { "epoch": 1.0, "step": 36617, "total_flos": 2449966641025024.0, "train_loss": 1.346002999772001, "train_runtime": 225227.5981, "train_samples_per_second": 15.608, "train_steps_per_second": 0.163 } ], "max_steps": 36617, "num_train_epochs": 1, "total_flos": 2449966641025024.0, "trial_name": null, "trial_params": null }